[{"id": 1, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 3, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 4, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 5, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 6, "image": "COCO_val2014_000000310196.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 7, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 8, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a car in the image?"}]}, {"id": 9, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a person in the image?"}]}, {"id": 10, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 11, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 12, "image": "COCO_val2014_000000210789.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 13, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a person in the image?"}]}, {"id": 14, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a dining table in the image?"}]}, {"id": 15, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 16, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a motorcycle in the image?"}]}, {"id": 17, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a car in the image?"}]}, {"id": 18, "image": "COCO_val2014_000000429109.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, train, bus. Based on this, is there a truck in the image?"}]}, {"id": 19, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a person in the image?"}]}, {"id": 20, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 21, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a potted plant in the image?"}]}, {"id": 22, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a vase in the image?"}]}, {"id": 23, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a car in the image?"}]}, {"id": 24, "image": "COCO_val2014_000000211674.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 25, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a traffic light in the image?"}]}, {"id": 26, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a bus in the image?"}]}, {"id": 27, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a person in the image?"}]}, {"id": 28, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a dining table in the image?"}]}, {"id": 29, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a car in the image?"}]}, {"id": 30, "image": "COCO_val2014_000000458338.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, car, clock. Based on this, is there a truck in the image?"}]}, {"id": 31, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a dog in the image?"}]}, {"id": 32, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a person in the image?"}]}, {"id": 33, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a dining table in the image?"}]}, {"id": 34, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a chair in the image?"}]}, {"id": 35, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a bed in the image?"}]}, {"id": 36, "image": "COCO_val2014_000000283412.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains dog, dining table, bed, cup. Based on this, is there a book in the image?"}]}, {"id": 37, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a person in the image?"}]}, {"id": 38, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a car in the image?"}]}, {"id": 39, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a spoon in the image?"}]}, {"id": 40, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a cup in the image?"}]}, {"id": 41, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a fork in the image?"}]}, {"id": 42, "image": "COCO_val2014_000000265719.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, fork, donut, cake. Based on this, is there a dining table in the image?"}]}, {"id": 43, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a tv in the image?"}]}, {"id": 44, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a person in the image?"}]}, {"id": 45, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a toaster in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a toaster in the image?"}]}, {"id": 46, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a book in the image?"}]}, {"id": 47, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a microwave in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a microwave in the image?"}]}, {"id": 48, "image": "COCO_val2014_000000461331.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, toaster, microwave, oven. Based on this, is there a bottle in the image?"}]}, {"id": 49, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 50, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 51, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 52, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 53, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 54, "image": "COCO_val2014_000000544456.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 55, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a bird in the image?"}]}, {"id": 56, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a handbag in the image?"}]}, {"id": 57, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a person in the image?"}]}, {"id": 58, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a car in the image?"}]}, {"id": 59, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a boat in the image?"}]}, {"id": 60, "image": "COCO_val2014_000000017708.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a chair in the image?"}]}, {"id": 61, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there a person in the image?"}]}, {"id": 62, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there a car in the image?"}]}, {"id": 63, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there an orange in the image?"}]}, {"id": 64, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there a dining table in the image?"}]}, {"id": 65, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there a bottle in the image?"}]}, {"id": 66, "image": "COCO_val2014_000000574692.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, orange, bottle. Based on this, is there a cup in the image?"}]}, {"id": 67, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a backpack in the image?"}]}, {"id": 68, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a handbag in the image?"}]}, {"id": 69, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a person in the image?"}]}, {"id": 70, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a car in the image?"}]}, {"id": 71, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a bus in the image?"}]}, {"id": 72, "image": "COCO_val2014_000000353180.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 73, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a person in the image?"}]}, {"id": 74, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a car in the image?"}]}, {"id": 75, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a dining table in the image?"}]}, {"id": 76, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a cup in the image?"}]}, {"id": 77, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a chair in the image?"}]}, {"id": 78, "image": "COCO_val2014_000000239444.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, microwave, oven. Based on this, is there a couch in the image?"}]}, {"id": 79, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a person in the image?"}]}, {"id": 80, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a car in the image?"}]}, {"id": 81, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 82, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a bowl in the image?"}]}, {"id": 83, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a hot dog in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a hot dog in the image?"}]}, {"id": 84, "image": "COCO_val2014_000000569839.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, sandwich, hot dog, dining table, chair, cup. Based on this, is there a handbag in the image?"}]}, {"id": 85, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a person in the image?"}]}, {"id": 86, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 87, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a car in the image?"}]}, {"id": 88, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a truck in the image?"}]}, {"id": 89, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 90, "image": "COCO_val2014_000000219622.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 91, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a knife in the image?"}]}, {"id": 92, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a cup in the image?"}]}, {"id": 93, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a person in the image?"}]}, {"id": 94, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a car in the image?"}]}, {"id": 95, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a cake in the image?"}]}, {"id": 96, "image": "COCO_val2014_000000300368.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains knife, person, cake, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 97, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a person in the image?"}]}, {"id": 98, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a car in the image?"}]}, {"id": 99, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a remote in the image?"}]}, {"id": 100, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a tv in the image?"}]}, {"id": 101, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 102, "image": "COCO_val2014_000000482476.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, remote, handbag, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 103, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 104, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 105, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 106, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 107, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a baseball bat in the image?"}]}, {"id": 108, "image": "COCO_val2014_000000131115.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a bench in the image?"}]}, {"id": 109, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a sink in the image?"}]}, {"id": 110, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 111, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a bench in the image?"}]}, {"id": 112, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a person in the image?"}]}, {"id": 113, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a toilet in the image?"}]}, {"id": 114, "image": "COCO_val2014_000000157084.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains sink, bench, toilet. Based on this, is there a vase in the image?"}]}, {"id": 115, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a person in the image?"}]}, {"id": 116, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a car in the image?"}]}, {"id": 117, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a teddy bear in the image?"}]}, {"id": 118, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a bed in the image?"}]}, {"id": 119, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a bear in the image?"}]}, {"id": 120, "image": "COCO_val2014_000000381895.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, teddy bear, bear. Based on this, is there a couch in the image?"}]}, {"id": 121, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 122, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a cup in the image?"}]}, {"id": 123, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 124, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 125, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a sandwich in the image?"}]}, {"id": 126, "image": "COCO_val2014_000000336872.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, dining table. Based on this, is there a fork in the image?"}]}, {"id": 127, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a bed in the image?"}]}, {"id": 128, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a person in the image?"}]}, {"id": 129, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a cat in the image?"}]}, {"id": 130, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a couch in the image?"}]}, {"id": 131, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a book in the image?"}]}, {"id": 132, "image": "COCO_val2014_000000075591.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, book. Based on this, is there a tv in the image?"}]}, {"id": 133, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a tv in the image?"}]}, {"id": 134, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a person in the image?"}]}, {"id": 135, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a mouse in the image?"}]}, {"id": 136, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a book in the image?"}]}, {"id": 137, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a laptop in the image?"}]}, {"id": 138, "image": "COCO_val2014_000000516916.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a bottle in the image?"}]}, {"id": 139, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a sink in the image?"}]}, {"id": 140, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a person in the image?"}]}, {"id": 141, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a toothbrush in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a toothbrush in the image?"}]}, {"id": 142, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a cup in the image?"}]}, {"id": 143, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 144, "image": "COCO_val2014_000000542145.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, toilet. Based on this, is there a dining table in the image?"}]}, {"id": 145, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there a truck in the image?"}]}, {"id": 146, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there a person in the image?"}]}, {"id": 147, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there an airplane in the image?"}]}, {"id": 148, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there a backpack in the image?"}]}, {"id": 149, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there a car in the image?"}]}, {"id": 150, "image": "COCO_val2014_000000218224.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, airplane, car. Based on this, is there a bus in the image?"}]}, {"id": 151, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 152, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 153, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 154, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 155, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 156, "image": "COCO_val2014_000000297078.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 157, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a tv in the image?"}]}, {"id": 158, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a dining table in the image?"}]}, {"id": 159, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a person in the image?"}]}, {"id": 160, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a car in the image?"}]}, {"id": 161, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a couch in the image?"}]}, {"id": 162, "image": "COCO_val2014_000000033270.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, refrigerator, orange, book. Based on this, is there a chair in the image?"}]}, {"id": 163, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a truck in the image?"}]}, {"id": 164, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a car in the image?"}]}, {"id": 165, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a person in the image?"}]}, {"id": 166, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a dining table in the image?"}]}, {"id": 167, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a cow in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a cow in the image?"}]}, {"id": 168, "image": "COCO_val2014_000000140583.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, cow, sheep. Based on this, is there a bicycle in the image?"}]}, {"id": 169, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a dog in the image?"}]}, {"id": 170, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a frisbee in the image?"}]}, {"id": 171, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a truck in the image?"}]}, {"id": 172, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a traffic light in the image?"}]}, {"id": 173, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a person in the image?"}]}, {"id": 174, "image": "COCO_val2014_000000421455.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 175, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a sink in the image?"}]}, {"id": 176, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a person in the image?"}]}, {"id": 177, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a toothbrush in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a toothbrush in the image?"}]}, {"id": 178, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a cup in the image?"}]}, {"id": 179, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a bottle in the image?"}]}, {"id": 180, "image": "COCO_val2014_000000288639.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, toothbrush, bottle, cat. Based on this, is there a dining table in the image?"}]}, {"id": 181, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there a person in the image?"}]}, {"id": 182, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there a car in the image?"}]}, {"id": 183, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there a bicycle in the image?"}]}, {"id": 184, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there a motorcycle in the image?"}]}, {"id": 185, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 186, "image": "COCO_val2014_000000291936.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 187, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a person in the image?"}]}, {"id": 188, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a car in the image?"}]}, {"id": 189, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a bicycle in the image?"}]}, {"id": 190, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a motorcycle in the image?"}]}, {"id": 191, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a skateboard in the image?"}]}, {"id": 192, "image": "COCO_val2014_000000063953.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, skateboard. Based on this, is there a bench in the image?"}]}, {"id": 193, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a laptop in the image?"}]}, {"id": 194, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a person in the image?"}]}, {"id": 195, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a remote in the image?"}]}, {"id": 196, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a couch in the image?"}]}, {"id": 197, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a dining table in the image?"}]}, {"id": 198, "image": "COCO_val2014_000000526321.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains laptop, remote, dining table, cell phone, tv, mouse, keyboard, book. Based on this, is there a cup in the image?"}]}, {"id": 199, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there a snowboard in the image?"}]}, {"id": 200, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there a skis in the image?"}]}, {"id": 201, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there a person in the image?"}]}, {"id": 202, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there a car in the image?"}]}, {"id": 203, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there a surfboard in the image?"}]}, {"id": 204, "image": "COCO_val2014_000000042190.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, surfboard. Based on this, is there an umbrella in the image?"}]}, {"id": 205, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a bird in the image?"}]}, {"id": 206, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a handbag in the image?"}]}, {"id": 207, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a person in the image?"}]}, {"id": 208, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a car in the image?"}]}, {"id": 209, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a boat in the image?"}]}, {"id": 210, "image": "COCO_val2014_000000553165.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bird, person, boat. Based on this, is there a chair in the image?"}]}, {"id": 211, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a dog in the image?"}]}, {"id": 212, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 213, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a person in the image?"}]}, {"id": 214, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 215, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a car in the image?"}]}, {"id": 216, "image": "COCO_val2014_000000170517.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car, umbrella. Based on this, is there a bus in the image?"}]}, {"id": 217, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a person in the image?"}]}, {"id": 218, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a dining table in the image?"}]}, {"id": 219, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a skateboard in the image?"}]}, {"id": 220, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a bicycle in the image?"}]}, {"id": 221, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a car in the image?"}]}, {"id": 222, "image": "COCO_val2014_000000498759.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, skateboard, car. Based on this, is there a truck in the image?"}]}, {"id": 223, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a person in the image?"}]}, {"id": 224, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a car in the image?"}]}, {"id": 225, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a fork in the image?"}]}, {"id": 226, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a dining table in the image?"}]}, {"id": 227, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a knife in the image?"}]}, {"id": 228, "image": "COCO_val2014_000000360600.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, fork, knife, pizza, cup. Based on this, is there a spoon in the image?"}]}, {"id": 229, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a tv in the image?"}]}, {"id": 230, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a chair in the image?"}]}, {"id": 231, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a person in the image?"}]}, {"id": 232, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a car in the image?"}]}, {"id": 233, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a mouse in the image?"}]}, {"id": 234, "image": "COCO_val2014_000000031773.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains tv, person, mouse, potted plant, laptop, dining table, keyboard. Based on this, is there a cell phone in the image?"}]}, {"id": 235, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a tv in the image?"}]}, {"id": 236, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a dining table in the image?"}]}, {"id": 237, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a backpack in the image?"}]}, {"id": 238, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a handbag in the image?"}]}, {"id": 239, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a person in the image?"}]}, {"id": 240, "image": "COCO_val2014_000000500257.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, suitcase. Based on this, is there a car in the image?"}]}, {"id": 241, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a car in the image?"}]}, {"id": 242, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a person in the image?"}]}, {"id": 243, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a train in the image?"}]}, {"id": 244, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a truck in the image?"}]}, {"id": 245, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a bed in the image?"}]}, {"id": 246, "image": "COCO_val2014_000000574057.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains car, train, bed. Based on this, is there a book in the image?"}]}, {"id": 247, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a traffic light in the image?"}]}, {"id": 248, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a bus in the image?"}]}, {"id": 249, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a truck in the image?"}]}, {"id": 250, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a motorcycle in the image?"}]}, {"id": 251, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a clock in the image?"}]}, {"id": 252, "image": "COCO_val2014_000000456178.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, clock, person, car. Based on this, is there a chair in the image?"}]}, {"id": 253, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a person in the image?"}]}, {"id": 254, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a car in the image?"}]}, {"id": 255, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a bottle in the image?"}]}, {"id": 256, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a spoon in the image?"}]}, {"id": 257, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a dining table in the image?"}]}, {"id": 258, "image": "COCO_val2014_000000565941.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, dining table, chair, cake, cup. Based on this, is there a laptop in the image?"}]}, {"id": 259, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a car in the image?"}]}, {"id": 260, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a truck in the image?"}]}, {"id": 261, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a person in the image?"}]}, {"id": 262, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a dining table in the image?"}]}, {"id": 263, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a sports ball in the image?"}]}, {"id": 264, "image": "COCO_val2014_000000485564.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains car, person, sports ball. Based on this, is there a tennis racket in the image?"}]}, {"id": 265, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a truck in the image?"}]}, {"id": 266, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a traffic light in the image?"}]}, {"id": 267, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a person in the image?"}]}, {"id": 268, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a dining table in the image?"}]}, {"id": 269, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a motorcycle in the image?"}]}, {"id": 270, "image": "COCO_val2014_000000454642.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle, car. Based on this, is there a bicycle in the image?"}]}, {"id": 271, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 272, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 273, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 274, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 275, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 276, "image": "COCO_val2014_000000205729.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 277, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a couch in the image?"}]}, {"id": 278, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a person in the image?"}]}, {"id": 279, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a chair in the image?"}]}, {"id": 280, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a dining table in the image?"}]}, {"id": 281, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a vase in the image?"}]}, {"id": 282, "image": "COCO_val2014_000000424792.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains couch, chair, vase, bed, cat. Based on this, is there a potted plant in the image?"}]}, {"id": 283, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a person in the image?"}]}, {"id": 284, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a car in the image?"}]}, {"id": 285, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a suitcase in the image?"}]}, {"id": 286, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 287, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a handbag in the image?"}]}, {"id": 288, "image": "COCO_val2014_000000329717.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag. Based on this, is there a dining table in the image?"}]}, {"id": 289, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a chair in the image?"}]}, {"id": 290, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a dining table in the image?"}]}, {"id": 291, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a person in the image?"}]}, {"id": 292, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a car in the image?"}]}, {"id": 293, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a horse in the image?"}]}, {"id": 294, "image": "COCO_val2014_000000012333.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains chair, person, horse. Based on this, is there a dog in the image?"}]}, {"id": 295, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a banana in the image?"}]}, {"id": 296, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a person in the image?"}]}, {"id": 297, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a spoon in the image?"}]}, {"id": 298, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a cup in the image?"}]}, {"id": 299, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a bowl in the image?"}]}, {"id": 300, "image": "COCO_val2014_000000480122.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, dining table, chair, knife, sink, refrigerator, bottle, oven. Based on this, is there a sandwich in the image?"}]}, {"id": 301, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a vase in the image?"}]}, {"id": 302, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a dining table in the image?"}]}, {"id": 303, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a sink in the image?"}]}, {"id": 304, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 305, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a potted plant in the image?"}]}, {"id": 306, "image": "COCO_val2014_000000515904.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, sink, potted plant, toilet. Based on this, is there a person in the image?"}]}, {"id": 307, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball glove in the image?"}]}, {"id": 308, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball bat in the image?"}]}, {"id": 309, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a person in the image?"}]}, {"id": 310, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a car in the image?"}]}, {"id": 311, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a sports ball in the image?"}]}, {"id": 312, "image": "COCO_val2014_000000437347.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a tennis racket in the image?"}]}, {"id": 313, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a person in the image?"}]}, {"id": 314, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 315, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a car in the image?"}]}, {"id": 316, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 317, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a bus in the image?"}]}, {"id": 318, "image": "COCO_val2014_000000354229.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 319, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a person in the image?"}]}, {"id": 320, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a car in the image?"}]}, {"id": 321, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a dining table in the image?"}]}, {"id": 322, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a cup in the image?"}]}, {"id": 323, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a handbag in the image?"}]}, {"id": 324, "image": "COCO_val2014_000000538236.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, handbag, hot dog. Based on this, is there a backpack in the image?"}]}, {"id": 325, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there a person in the image?"}]}, {"id": 326, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 327, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there an orange in the image?"}]}, {"id": 328, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there a bowl in the image?"}]}, {"id": 329, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there a car in the image?"}]}, {"id": 330, "image": "COCO_val2014_000000236865.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, frisbee. Based on this, is there a truck in the image?"}]}, {"id": 331, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a person in the image?"}]}, {"id": 332, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a car in the image?"}]}, {"id": 333, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a wine glass in the image?"}]}, {"id": 334, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a cup in the image?"}]}, {"id": 335, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a bottle in the image?"}]}, {"id": 336, "image": "COCO_val2014_000000217397.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, fork, dining table, cell phone. Based on this, is there a spoon in the image?"}]}, {"id": 337, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a backpack in the image?"}]}, {"id": 338, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a person in the image?"}]}, {"id": 339, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a bed in the image?"}]}, {"id": 340, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a dining table in the image?"}]}, {"id": 341, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a book in the image?"}]}, {"id": 342, "image": "COCO_val2014_000000060213.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains backpack, bed, book. Based on this, is there a tv in the image?"}]}, {"id": 343, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 344, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 345, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a person in the image?"}]}, {"id": 346, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 347, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a backpack in the image?"}]}, {"id": 348, "image": "COCO_val2014_000000054025.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, handbag, car, bus. Based on this, is there a skis in the image?"}]}, {"id": 349, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a person in the image?"}]}, {"id": 350, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a car in the image?"}]}, {"id": 351, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 352, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a truck in the image?"}]}, {"id": 353, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a bicycle in the image?"}]}, {"id": 354, "image": "COCO_val2014_000000084447.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bicycle. Based on this, is there a bus in the image?"}]}, {"id": 355, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a person in the image?"}]}, {"id": 356, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a car in the image?"}]}, {"id": 357, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a dining table in the image?"}]}, {"id": 358, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a cup in the image?"}]}, {"id": 359, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a refrigerator in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a refrigerator in the image?"}]}, {"id": 360, "image": "COCO_val2014_000000192660.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, refrigerator, bench, orange. Based on this, is there a bottle in the image?"}]}, {"id": 361, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a sandwich in the image?"}]}, {"id": 362, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a cup in the image?"}]}, {"id": 363, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a carrot in the image?"}]}, {"id": 364, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 365, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a broccoli in the image?"}]}, {"id": 366, "image": "COCO_val2014_000000575755.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains sandwich, carrot, broccoli, dining table. Based on this, is there a knife in the image?"}]}, {"id": 367, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a person in the image?"}]}, {"id": 368, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a chair in the image?"}]}, {"id": 369, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a car in the image?"}]}, {"id": 370, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 371, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 372, "image": "COCO_val2014_000000354088.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, car, dining table, orange, apple, bus, umbrella. Based on this, is there a cup in the image?"}]}, {"id": 373, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a person in the image?"}]}, {"id": 374, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a car in the image?"}]}, {"id": 375, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a boat in the image?"}]}, {"id": 376, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a bird in the image?"}]}, {"id": 377, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a handbag in the image?"}]}, {"id": 378, "image": "COCO_val2014_000000311327.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, boat, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 379, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a person in the image?"}]}, {"id": 380, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a car in the image?"}]}, {"id": 381, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a bench in the image?"}]}, {"id": 382, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a dining table in the image?"}]}, {"id": 383, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a skateboard in the image?"}]}, {"id": 384, "image": "COCO_val2014_000000456552.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skateboard. Based on this, is there a bicycle in the image?"}]}, {"id": 385, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a spoon in the image?"}]}, {"id": 386, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a bowl in the image?"}]}, {"id": 387, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a bottle in the image?"}]}, {"id": 388, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a person in the image?"}]}, {"id": 389, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a refrigerator in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a refrigerator in the image?"}]}, {"id": 390, "image": "COCO_val2014_000000350898.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains spoon, bottle, refrigerator, oven, cup. Based on this, is there a chair in the image?"}]}, {"id": 391, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a sink in the image?"}]}, {"id": 392, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 393, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a potted plant in the image?"}]}, {"id": 394, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a person in the image?"}]}, {"id": 395, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a toilet in the image?"}]}, {"id": 396, "image": "COCO_val2014_000000170365.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains sink, potted plant, toilet. Based on this, is there a vase in the image?"}]}, {"id": 397, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a backpack in the image?"}]}, {"id": 398, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a person in the image?"}]}, {"id": 399, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a clock in the image?"}]}, {"id": 400, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a car in the image?"}]}, {"id": 401, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a couch in the image?"}]}, {"id": 402, "image": "COCO_val2014_000000021645.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, couch, dining table, chair, book. Based on this, is there a tv in the image?"}]}, {"id": 403, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a person in the image?"}]}, {"id": 404, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 405, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a car in the image?"}]}, {"id": 406, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a truck in the image?"}]}, {"id": 407, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 408, "image": "COCO_val2014_000000528905.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, car, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 409, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a person in the image?"}]}, {"id": 410, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a car in the image?"}]}, {"id": 411, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a bed in the image?"}]}, {"id": 412, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a book in the image?"}]}, {"id": 413, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a tie in the image?"}]}, {"id": 414, "image": "COCO_val2014_000000239347.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bed, tie. Based on this, is there a dining table in the image?"}]}, {"id": 415, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a tv in the image?"}]}, {"id": 416, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a chair in the image?"}]}, {"id": 417, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a person in the image?"}]}, {"id": 418, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a car in the image?"}]}, {"id": 419, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a remote in the image?"}]}, {"id": 420, "image": "COCO_val2014_000000007320.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, dining table. Based on this, is there a couch in the image?"}]}, {"id": 421, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a chair in the image?"}]}, {"id": 422, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a dining table in the image?"}]}, {"id": 423, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a person in the image?"}]}, {"id": 424, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a car in the image?"}]}, {"id": 425, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a remote in the image?"}]}, {"id": 426, "image": "COCO_val2014_000000249715.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, remote. Based on this, is there a tv in the image?"}]}, {"id": 427, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 428, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 429, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 430, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 431, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 432, "image": "COCO_val2014_000000080022.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 433, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a person in the image?"}]}, {"id": 434, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a handbag in the image?"}]}, {"id": 435, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a truck in the image?"}]}, {"id": 436, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a traffic light in the image?"}]}, {"id": 437, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a laptop in the image?"}]}, {"id": 438, "image": "COCO_val2014_000000564336.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, truck, laptop, dining table, chair, parking meter, bottle, car. Based on this, is there a tv in the image?"}]}, {"id": 439, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a chair in the image?"}]}, {"id": 440, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a dining table in the image?"}]}, {"id": 441, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a person in the image?"}]}, {"id": 442, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a car in the image?"}]}, {"id": 443, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a couch in the image?"}]}, {"id": 444, "image": "COCO_val2014_000000231589.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, bed. Based on this, is there a tv in the image?"}]}, {"id": 445, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a person in the image?"}]}, {"id": 446, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a car in the image?"}]}, {"id": 447, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a clock in the image?"}]}, {"id": 448, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a chair in the image?"}]}, {"id": 449, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a couch in the image?"}]}, {"id": 450, "image": "COCO_val2014_000000465275.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, clock, couch, remote, vase. Based on this, is there a tv in the image?"}]}, {"id": 451, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 452, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 453, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 454, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 455, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 456, "image": "COCO_val2014_000000083275.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 457, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 458, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 459, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 460, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 461, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 462, "image": "COCO_val2014_000000406403.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 463, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a person in the image?"}]}, {"id": 464, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a car in the image?"}]}, {"id": 465, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a bowl in the image?"}]}, {"id": 466, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a dining table in the image?"}]}, {"id": 467, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a scissors in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a scissors in the image?"}]}, {"id": 468, "image": "COCO_val2014_000000131018.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, scissors, spoon, bottle, sink, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 469, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there a chair in the image?"}]}, {"id": 470, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there a dining table in the image?"}]}, {"id": 471, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there a person in the image?"}]}, {"id": 472, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there a car in the image?"}]}, {"id": 473, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there an airplane in the image?"}]}, {"id": 474, "image": "COCO_val2014_000000332625.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains chair, person, airplane, tv. Based on this, is there a truck in the image?"}]}, {"id": 475, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a dog in the image?"}]}, {"id": 476, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a car in the image?"}]}, {"id": 477, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a person in the image?"}]}, {"id": 478, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 479, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 480, "image": "COCO_val2014_000000332025.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains dog, person, backpack, skis, snowboard, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 481, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a person in the image?"}]}, {"id": 482, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a car in the image?"}]}, {"id": 483, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a horse in the image?"}]}, {"id": 484, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a dog in the image?"}]}, {"id": 485, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a sheep in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a sheep in the image?"}]}, {"id": 486, "image": "COCO_val2014_000000318204.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, horse, sheep, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 487, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a person in the image?"}]}, {"id": 488, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a car in the image?"}]}, {"id": 489, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a laptop in the image?"}]}, {"id": 490, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a tv in the image?"}]}, {"id": 491, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 492, "image": "COCO_val2014_000000455157.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, laptop, dining table, bench, umbrella. Based on this, is there a cup in the image?"}]}, {"id": 493, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a bird in the image?"}]}, {"id": 494, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a boat in the image?"}]}, {"id": 495, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a person in the image?"}]}, {"id": 496, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 497, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 498, "image": "COCO_val2014_000000069189.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains bird, person, handbag, bicycle, car, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 499, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a backpack in the image?"}]}, {"id": 500, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a skis in the image?"}]}, {"id": 501, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a truck in the image?"}]}, {"id": 502, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a car in the image?"}]}, {"id": 503, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a person in the image?"}]}, {"id": 504, "image": "COCO_val2014_000000199764.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, dining table, chair, bench. Based on this, is there a cup in the image?"}]}, {"id": 505, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a vase in the image?"}]}, {"id": 506, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a dining table in the image?"}]}, {"id": 507, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a bowl in the image?"}]}, {"id": 508, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a cup in the image?"}]}, {"id": 509, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a toilet in the image?"}]}, {"id": 510, "image": "COCO_val2014_000000148766.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains vase, bowl, toilet. Based on this, is there a sink in the image?"}]}, {"id": 511, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there a person in the image?"}]}, {"id": 512, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there a car in the image?"}]}, {"id": 513, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there an orange in the image?"}]}, {"id": 514, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 515, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 516, "image": "COCO_val2014_000000175506.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, orange, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 517, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a tv in the image?"}]}, {"id": 518, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a person in the image?"}]}, {"id": 519, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a mouse in the image?"}]}, {"id": 520, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a chair in the image?"}]}, {"id": 521, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a laptop in the image?"}]}, {"id": 522, "image": "COCO_val2014_000000353096.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, apple. Based on this, is there a cell phone in the image?"}]}, {"id": 523, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a chair in the image?"}]}, {"id": 524, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a person in the image?"}]}, {"id": 525, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a broccoli in the image?"}]}, {"id": 526, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a dining table in the image?"}]}, {"id": 527, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a carrot in the image?"}]}, {"id": 528, "image": "COCO_val2014_000000207205.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains chair, broccoli, carrot. Based on this, is there a bowl in the image?"}]}, {"id": 529, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a person in the image?"}]}, {"id": 530, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a car in the image?"}]}, {"id": 531, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a bench in the image?"}]}, {"id": 532, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a dining table in the image?"}]}, {"id": 533, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a clock in the image?"}]}, {"id": 534, "image": "COCO_val2014_000000427113.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, bench, clock. Based on this, is there a chair in the image?"}]}, {"id": 535, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a sink in the image?"}]}, {"id": 536, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 537, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a person in the image?"}]}, {"id": 538, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a car in the image?"}]}, {"id": 539, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a toilet in the image?"}]}, {"id": 540, "image": "COCO_val2014_000000498374.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains sink, person, toilet. Based on this, is there a vase in the image?"}]}, {"id": 541, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a truck in the image?"}]}, {"id": 542, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a car in the image?"}]}, {"id": 543, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a person in the image?"}]}, {"id": 544, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a dining table in the image?"}]}, {"id": 545, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there an airplane in the image?"}]}, {"id": 546, "image": "COCO_val2014_000000013348.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a backpack in the image?"}]}, {"id": 547, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a traffic light in the image?"}]}, {"id": 548, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a bus in the image?"}]}, {"id": 549, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a truck in the image?"}]}, {"id": 550, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a motorcycle in the image?"}]}, {"id": 551, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a person in the image?"}]}, {"id": 552, "image": "COCO_val2014_000000081336.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, person, car, stop sign. Based on this, is there a dining table in the image?"}]}, {"id": 553, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a dog in the image?"}]}, {"id": 554, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a person in the image?"}]}, {"id": 555, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a bowl in the image?"}]}, {"id": 556, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a cup in the image?"}]}, {"id": 557, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a sandwich in the image?"}]}, {"id": 558, "image": "COCO_val2014_000000190185.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, bowl, sandwich, hot dog. Based on this, is there a dining table in the image?"}]}, {"id": 559, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a spoon in the image?"}]}, {"id": 560, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a cup in the image?"}]}, {"id": 561, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a bowl in the image?"}]}, {"id": 562, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a dining table in the image?"}]}, {"id": 563, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a person in the image?"}]}, {"id": 564, "image": "COCO_val2014_000000209755.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, carrot, oven. Based on this, is there a car in the image?"}]}, {"id": 565, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a dog in the image?"}]}, {"id": 566, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a truck in the image?"}]}, {"id": 567, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a person in the image?"}]}, {"id": 568, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a dining table in the image?"}]}, {"id": 569, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a car in the image?"}]}, {"id": 570, "image": "COCO_val2014_000000227227.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains dog, person, car. Based on this, is there a bus in the image?"}]}, {"id": 571, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a person in the image?"}]}, {"id": 572, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a car in the image?"}]}, {"id": 573, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a bed in the image?"}]}, {"id": 574, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 575, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a cat in the image?"}]}, {"id": 576, "image": "COCO_val2014_000000397705.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, bed, cat, book, cup. Based on this, is there a couch in the image?"}]}, {"id": 577, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a person in the image?"}]}, {"id": 578, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 579, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a car in the image?"}]}, {"id": 580, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 581, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a bus in the image?"}]}, {"id": 582, "image": "COCO_val2014_000000287305.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 583, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a sink in the image?"}]}, {"id": 584, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a person in the image?"}]}, {"id": 585, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a toilet in the image?"}]}, {"id": 586, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a vase in the image?"}]}, {"id": 587, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a bottle in the image?"}]}, {"id": 588, "image": "COCO_val2014_000000257327.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, toilet, bottle. Based on this, is there a dining table in the image?"}]}, {"id": 589, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 590, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 591, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a bicycle in the image?"}]}, {"id": 592, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a bus in the image?"}]}, {"id": 593, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a car in the image?"}]}, {"id": 594, "image": "COCO_val2014_000000557016.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cow, motorcycle. Based on this, is there a truck in the image?"}]}, {"id": 595, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 596, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 597, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 598, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 599, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 600, "image": "COCO_val2014_000000105732.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 601, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a tv in the image?"}]}, {"id": 602, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a person in the image?"}]}, {"id": 603, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a couch in the image?"}]}, {"id": 604, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 605, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a boat in the image?"}]}, {"id": 606, "image": "COCO_val2014_000000534121.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, boat, chair, book, cup. Based on this, is there a car in the image?"}]}, {"id": 607, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a motorcycle in the image?"}]}, {"id": 608, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a person in the image?"}]}, {"id": 609, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a bicycle in the image?"}]}, {"id": 610, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a bus in the image?"}]}, {"id": 611, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a car in the image?"}]}, {"id": 612, "image": "COCO_val2014_000000520524.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, bicycle, car, dining table, orange. Based on this, is there a truck in the image?"}]}, {"id": 613, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a person in the image?"}]}, {"id": 614, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a car in the image?"}]}, {"id": 615, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a bowl in the image?"}]}, {"id": 616, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a dining table in the image?"}]}, {"id": 617, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a spoon in the image?"}]}, {"id": 618, "image": "COCO_val2014_000000580294.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, sink, cake, toothbrush, oven, cup. Based on this, is there a bottle in the image?"}]}, {"id": 619, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a couch in the image?"}]}, {"id": 620, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a person in the image?"}]}, {"id": 621, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a bed in the image?"}]}, {"id": 622, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a book in the image?"}]}, {"id": 623, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a cat in the image?"}]}, {"id": 624, "image": "COCO_val2014_000000374061.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains couch, bed, cat, teddy bear, bear. Based on this, is there a chair in the image?"}]}, {"id": 625, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 626, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a surfboard in the image?"}]}, {"id": 627, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 628, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 629, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 630, "image": "COCO_val2014_000000094944.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 631, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a bowl in the image?"}]}, {"id": 632, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a cup in the image?"}]}, {"id": 633, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a toilet in the image?"}]}, {"id": 634, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a sink in the image?"}]}, {"id": 635, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a cat in the image?"}]}, {"id": 636, "image": "COCO_val2014_000000572075.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bowl, toilet, cat. Based on this, is there a couch in the image?"}]}, {"id": 637, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a spoon in the image?"}]}, {"id": 638, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a bowl in the image?"}]}, {"id": 639, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a laptop in the image?"}]}, {"id": 640, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a person in the image?"}]}, {"id": 641, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a remote in the image?"}]}, {"id": 642, "image": "COCO_val2014_000000387098.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains spoon, laptop, remote, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a couch in the image?"}]}, {"id": 643, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a person in the image?"}]}, {"id": 644, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a car in the image?"}]}, {"id": 645, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a bicycle in the image?"}]}, {"id": 646, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a motorcycle in the image?"}]}, {"id": 647, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a potted plant in the image?"}]}, {"id": 648, "image": "COCO_val2014_000000382670.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, potted plant, boat, cow. Based on this, is there a dining table in the image?"}]}, {"id": 649, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a person in the image?"}]}, {"id": 650, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a car in the image?"}]}, {"id": 651, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a dining table in the image?"}]}, {"id": 652, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a cup in the image?"}]}, {"id": 653, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a chair in the image?"}]}, {"id": 654, "image": "COCO_val2014_000000414516.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, bench, elephant. Based on this, is there a couch in the image?"}]}, {"id": 655, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 656, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 657, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a person in the image?"}]}, {"id": 658, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 659, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a backpack in the image?"}]}, {"id": 660, "image": "COCO_val2014_000000204360.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, backpack, bicycle, car, bus. Based on this, is there a handbag in the image?"}]}, {"id": 661, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a person in the image?"}]}, {"id": 662, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a car in the image?"}]}, {"id": 663, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a bicycle in the image?"}]}, {"id": 664, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a motorcycle in the image?"}]}, {"id": 665, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a sheep in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a sheep in the image?"}]}, {"id": 666, "image": "COCO_val2014_000000245642.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, sheep. Based on this, is there a truck in the image?"}]}, {"id": 667, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a person in the image?"}]}, {"id": 668, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a car in the image?"}]}, {"id": 669, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a remote in the image?"}]}, {"id": 670, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a chair in the image?"}]}, {"id": 671, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a dining table in the image?"}]}, {"id": 672, "image": "COCO_val2014_000000237767.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, remote, dining table, apple, cell phone, tv, couch, book. Based on this, is there a cup in the image?"}]}, {"id": 673, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a tie in the image?"}]}, {"id": 674, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a person in the image?"}]}, {"id": 675, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a bear in the image?"}]}, {"id": 676, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a couch in the image?"}]}, {"id": 677, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a teddy bear in the image?"}]}, {"id": 678, "image": "COCO_val2014_000000370900.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains tie, bear, teddy bear, dining table. Based on this, is there a bed in the image?"}]}, {"id": 679, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a cake in the image?"}]}, {"id": 680, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a person in the image?"}]}, {"id": 681, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 682, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a cup in the image?"}]}, {"id": 683, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a fork in the image?"}]}, {"id": 684, "image": "COCO_val2014_000000094501.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains cake, bottle, fork, dining table. Based on this, is there a knife in the image?"}]}, {"id": 685, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 686, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there a skis in the image?"}]}, {"id": 687, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there a person in the image?"}]}, {"id": 688, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there a car in the image?"}]}, {"id": 689, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there an airplane in the image?"}]}, {"id": 690, "image": "COCO_val2014_000000069196.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, airplane, handbag. Based on this, is there a truck in the image?"}]}, {"id": 691, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a tv in the image?"}]}, {"id": 692, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a person in the image?"}]}, {"id": 693, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a couch in the image?"}]}, {"id": 694, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a book in the image?"}]}, {"id": 695, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a dining table in the image?"}]}, {"id": 696, "image": "COCO_val2014_000000366141.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, dining table, chair, cat. Based on this, is there a cup in the image?"}]}, {"id": 697, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a person in the image?"}]}, {"id": 698, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a car in the image?"}]}, {"id": 699, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a bowl in the image?"}]}, {"id": 700, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a cup in the image?"}]}, {"id": 701, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a fork in the image?"}]}, {"id": 702, "image": "COCO_val2014_000000093946.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, fork, dining table, chair, pizza. Based on this, is there a knife in the image?"}]}, {"id": 703, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a backpack in the image?"}]}, {"id": 704, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a person in the image?"}]}, {"id": 705, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a bench in the image?"}]}, {"id": 706, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a chair in the image?"}]}, {"id": 707, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a laptop in the image?"}]}, {"id": 708, "image": "COCO_val2014_000000032610.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains backpack, bench, laptop, dining table. Based on this, is there a tv in the image?"}]}, {"id": 709, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a person in the image?"}]}, {"id": 710, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 711, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a bicycle in the image?"}]}, {"id": 712, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a motorcycle in the image?"}]}, {"id": 713, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a car in the image?"}]}, {"id": 714, "image": "COCO_val2014_000000239130.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, car, cell phone. Based on this, is there a truck in the image?"}]}, {"id": 715, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a spoon in the image?"}]}, {"id": 716, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a person in the image?"}]}, {"id": 717, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a bowl in the image?"}]}, {"id": 718, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a dining table in the image?"}]}, {"id": 719, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a bottle in the image?"}]}, {"id": 720, "image": "COCO_val2014_000000226097.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, bottle, sink, refrigerator, oven, cup. Based on this, is there a chair in the image?"}]}, {"id": 721, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a banana in the image?"}]}, {"id": 722, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a bowl in the image?"}]}, {"id": 723, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a person in the image?"}]}, {"id": 724, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a car in the image?"}]}, {"id": 725, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a handbag in the image?"}]}, {"id": 726, "image": "COCO_val2014_000000538054.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains banana, person, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 727, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a backpack in the image?"}]}, {"id": 728, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a handbag in the image?"}]}, {"id": 729, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a person in the image?"}]}, {"id": 730, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a car in the image?"}]}, {"id": 731, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a sheep in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a sheep in the image?"}]}, {"id": 732, "image": "COCO_val2014_000000114710.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sheep. Based on this, is there a truck in the image?"}]}, {"id": 733, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a chair in the image?"}]}, {"id": 734, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a person in the image?"}]}, {"id": 735, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a clock in the image?"}]}, {"id": 736, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a dining table in the image?"}]}, {"id": 737, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a bed in the image?"}]}, {"id": 738, "image": "COCO_val2014_000000113701.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, bed, book. Based on this, is there a cat in the image?"}]}, {"id": 739, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a person in the image?"}]}, {"id": 740, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a dining table in the image?"}]}, {"id": 741, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 742, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a truck in the image?"}]}, {"id": 743, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a car in the image?"}]}, {"id": 744, "image": "COCO_val2014_000000065001.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a bus in the image?"}]}, {"id": 745, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a person in the image?"}]}, {"id": 746, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a car in the image?"}]}, {"id": 747, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a knife in the image?"}]}, {"id": 748, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a dining table in the image?"}]}, {"id": 749, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a vase in the image?"}]}, {"id": 750, "image": "COCO_val2014_000000482275.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, knife, vase, cup, cake, tie. Based on this, is there a potted plant in the image?"}]}, {"id": 751, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a toothbrush in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a toothbrush in the image?"}]}, {"id": 752, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a sink in the image?"}]}, {"id": 753, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a couch in the image?"}]}, {"id": 754, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a chair in the image?"}]}, {"id": 755, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a person in the image?"}]}, {"id": 756, "image": "COCO_val2014_000000140983.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains toothbrush, couch, person. Based on this, is there a car in the image?"}]}, {"id": 757, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a traffic light in the image?"}]}, {"id": 758, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a person in the image?"}]}, {"id": 759, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a train in the image?"}]}, {"id": 760, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a car in the image?"}]}, {"id": 761, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a stop sign in the image?"}]}, {"id": 762, "image": "COCO_val2014_000000044520.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, stop sign. Based on this, is there a truck in the image?"}]}, {"id": 763, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a toaster in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a toaster in the image?"}]}, {"id": 764, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a tv in the image?"}]}, {"id": 765, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a person in the image?"}]}, {"id": 766, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a car in the image?"}]}, {"id": 767, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a microwave in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a microwave in the image?"}]}, {"id": 768, "image": "COCO_val2014_000000518177.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains toaster, person, microwave, oven. Based on this, is there a bottle in the image?"}]}, {"id": 769, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a person in the image?"}]}, {"id": 770, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a car in the image?"}]}, {"id": 771, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a couch in the image?"}]}, {"id": 772, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a chair in the image?"}]}, {"id": 773, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a dining table in the image?"}]}, {"id": 774, "image": "COCO_val2014_000000203479.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, teddy bear, cup. Based on this, is there a bottle in the image?"}]}, {"id": 775, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a handbag in the image?"}]}, {"id": 776, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a person in the image?"}]}, {"id": 777, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a potted plant in the image?"}]}, {"id": 778, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a vase in the image?"}]}, {"id": 779, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a dining table in the image?"}]}, {"id": 780, "image": "COCO_val2014_000000551881.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains handbag, potted plant, dining table, chair, refrigerator, book. Based on this, is there a cup in the image?"}]}, {"id": 781, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 782, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a car in the image?"}]}, {"id": 783, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a person in the image?"}]}, {"id": 784, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 785, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 786, "image": "COCO_val2014_000000369541.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there an orange in the image?"}]}, {"id": 787, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a clock in the image?"}]}, {"id": 788, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a person in the image?"}]}, {"id": 789, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a bed in the image?"}]}, {"id": 790, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a book in the image?"}]}, {"id": 791, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a remote in the image?"}]}, {"id": 792, "image": "COCO_val2014_000000007795.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, remote. Based on this, is there a tv in the image?"}]}, {"id": 793, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a bottle in the image?"}]}, {"id": 794, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a person in the image?"}]}, {"id": 795, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a cat in the image?"}]}, {"id": 796, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a couch in the image?"}]}, {"id": 797, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a toilet in the image?"}]}, {"id": 798, "image": "COCO_val2014_000000303099.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains bottle, cat, toilet. Based on this, is there a sink in the image?"}]}, {"id": 799, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a fire hydrant in the image?"}]}, {"id": 800, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a person in the image?"}]}, {"id": 801, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a car in the image?"}]}, {"id": 802, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a truck in the image?"}]}, {"id": 803, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a stop sign in the image?"}]}, {"id": 804, "image": "COCO_val2014_000000147289.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a traffic light in the image?"}]}, {"id": 805, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a tv in the image?"}]}, {"id": 806, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a dining table in the image?"}]}, {"id": 807, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a person in the image?"}]}, {"id": 808, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a car in the image?"}]}, {"id": 809, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a remote in the image?"}]}, {"id": 810, "image": "COCO_val2014_000000102439.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a couch in the image?"}]}, {"id": 811, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a boat in the image?"}]}, {"id": 812, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a person in the image?"}]}, {"id": 813, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a dog in the image?"}]}, {"id": 814, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a car in the image?"}]}, {"id": 815, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a cat in the image?"}]}, {"id": 816, "image": "COCO_val2014_000000183757.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains boat, dog, cat. Based on this, is there a couch in the image?"}]}, {"id": 817, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a person in the image?"}]}, {"id": 818, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a car in the image?"}]}, {"id": 819, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a broccoli in the image?"}]}, {"id": 820, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a bowl in the image?"}]}, {"id": 821, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a handbag in the image?"}]}, {"id": 822, "image": "COCO_val2014_000000500473.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, broccoli, handbag, carrot, dining table, orange, apple. Based on this, is there a backpack in the image?"}]}, {"id": 823, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 824, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a dining table in the image?"}]}, {"id": 825, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 826, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 827, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 828, "image": "COCO_val2014_000000327532.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 829, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a car in the image?"}]}, {"id": 830, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a truck in the image?"}]}, {"id": 831, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a person in the image?"}]}, {"id": 832, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a dining table in the image?"}]}, {"id": 833, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a skateboard in the image?"}]}, {"id": 834, "image": "COCO_val2014_000000167110.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains car, person, skateboard. Based on this, is there a bicycle in the image?"}]}, {"id": 835, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there a person in the image?"}]}, {"id": 836, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there a car in the image?"}]}, {"id": 837, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there a spoon in the image?"}]}, {"id": 838, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there an oven in the image?"}]}, {"id": 839, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there a bowl in the image?"}]}, {"id": 840, "image": "COCO_val2014_000000300876.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, cake, handbag, bottle, cup. Based on this, is there a banana in the image?"}]}, {"id": 841, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a tv in the image?"}]}, {"id": 842, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a person in the image?"}]}, {"id": 843, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a chair in the image?"}]}, {"id": 844, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a dining table in the image?"}]}, {"id": 845, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a couch in the image?"}]}, {"id": 846, "image": "COCO_val2014_000000443240.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, chair, couch. Based on this, is there a book in the image?"}]}, {"id": 847, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 848, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a car in the image?"}]}, {"id": 849, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a person in the image?"}]}, {"id": 850, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 851, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 852, "image": "COCO_val2014_000000288042.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains truck, person, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 853, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a person in the image?"}]}, {"id": 854, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a car in the image?"}]}, {"id": 855, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a dining table in the image?"}]}, {"id": 856, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a bottle in the image?"}]}, {"id": 857, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a chair in the image?"}]}, {"id": 858, "image": "COCO_val2014_000000270609.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, orange, cup. Based on this, is there a couch in the image?"}]}, {"id": 859, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a keyboard in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a keyboard in the image?"}]}, {"id": 860, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a dining table in the image?"}]}, {"id": 861, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a person in the image?"}]}, {"id": 862, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a car in the image?"}]}, {"id": 863, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a laptop in the image?"}]}, {"id": 864, "image": "COCO_val2014_000000208028.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains keyboard, person, laptop. Based on this, is there a tv in the image?"}]}, {"id": 865, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a person in the image?"}]}, {"id": 866, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a car in the image?"}]}, {"id": 867, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 868, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 869, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a cell phone in the image?"}]}, {"id": 870, "image": "COCO_val2014_000000314992.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 871, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a person in the image?"}]}, {"id": 872, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a car in the image?"}]}, {"id": 873, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a bottle in the image?"}]}, {"id": 874, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 875, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 876, "image": "COCO_val2014_000000424642.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 877, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a tv in the image?"}]}, {"id": 878, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 879, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a person in the image?"}]}, {"id": 880, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a car in the image?"}]}, {"id": 881, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a couch in the image?"}]}, {"id": 882, "image": "COCO_val2014_000000467176.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, remote, chair, book, cup. Based on this, is there a vase in the image?"}]}, {"id": 883, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a motorcycle in the image?"}]}, {"id": 884, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 885, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a person in the image?"}]}, {"id": 886, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a dining table in the image?"}]}, {"id": 887, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a car in the image?"}]}, {"id": 888, "image": "COCO_val2014_000000087435.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, car, bench, bus. Based on this, is there a truck in the image?"}]}, {"id": 889, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a sink in the image?"}]}, {"id": 890, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a person in the image?"}]}, {"id": 891, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a bottle in the image?"}]}, {"id": 892, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a dining table in the image?"}]}, {"id": 893, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a toilet in the image?"}]}, {"id": 894, "image": "COCO_val2014_000000079446.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains sink, bottle, toilet, cup. Based on this, is there a vase in the image?"}]}, {"id": 895, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a dog in the image?"}]}, {"id": 896, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a frisbee in the image?"}]}, {"id": 897, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a truck in the image?"}]}, {"id": 898, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a traffic light in the image?"}]}, {"id": 899, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a person in the image?"}]}, {"id": 900, "image": "COCO_val2014_000000354398.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, person, car, tie. Based on this, is there a dining table in the image?"}]}, {"id": 901, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a vase in the image?"}]}, {"id": 902, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 903, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a bird in the image?"}]}, {"id": 904, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a person in the image?"}]}, {"id": 905, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 906, "image": "COCO_val2014_000000430052.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, bird, bottle, dining table. Based on this, is there a cup in the image?"}]}, {"id": 907, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a teddy bear in the image?"}]}, {"id": 908, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a bear in the image?"}]}, {"id": 909, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a person in the image?"}]}, {"id": 910, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a car in the image?"}]}, {"id": 911, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a book in the image?"}]}, {"id": 912, "image": "COCO_val2014_000000567886.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, book. Based on this, is there a tv in the image?"}]}, {"id": 913, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a sink in the image?"}]}, {"id": 914, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a bottle in the image?"}]}, {"id": 915, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a person in the image?"}]}, {"id": 916, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a car in the image?"}]}, {"id": 917, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a potted plant in the image?"}]}, {"id": 918, "image": "COCO_val2014_000000539251.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, person, potted plant. Based on this, is there a dining table in the image?"}]}, {"id": 919, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a broccoli in the image?"}]}, {"id": 920, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 921, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a carrot in the image?"}]}, {"id": 922, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a person in the image?"}]}, {"id": 923, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a bed in the image?"}]}, {"id": 924, "image": "COCO_val2014_000000551908.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains broccoli, carrot, bed, dining table. Based on this, is there a book in the image?"}]}, {"id": 925, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a traffic light in the image?"}]}, {"id": 926, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a person in the image?"}]}, {"id": 927, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a car in the image?"}]}, {"id": 928, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a truck in the image?"}]}, {"id": 929, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a fire hydrant in the image?"}]}, {"id": 930, "image": "COCO_val2014_000000102906.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, fire hydrant. Based on this, is there a stop sign in the image?"}]}, {"id": 931, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a vase in the image?"}]}, {"id": 932, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 933, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a bed in the image?"}]}, {"id": 934, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a person in the image?"}]}, {"id": 935, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 936, "image": "COCO_val2014_000000327771.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, bed, dining table. Based on this, is there a cup in the image?"}]}, {"id": 937, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 938, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a cup in the image?"}]}, {"id": 939, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a person in the image?"}]}, {"id": 940, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a car in the image?"}]}, {"id": 941, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 942, "image": "COCO_val2014_000000280734.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a chair in the image?"}]}, {"id": 943, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a person in the image?"}]}, {"id": 944, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a car in the image?"}]}, {"id": 945, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a cup in the image?"}]}, {"id": 946, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 947, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a cake in the image?"}]}, {"id": 948, "image": "COCO_val2014_000000111817.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, cup, cake, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 949, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a person in the image?"}]}, {"id": 950, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a car in the image?"}]}, {"id": 951, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a handbag in the image?"}]}, {"id": 952, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a backpack in the image?"}]}, {"id": 953, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a bottle in the image?"}]}, {"id": 954, "image": "COCO_val2014_000000379162.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bottle, tennis racket, chair. Based on this, is there a dining table in the image?"}]}, {"id": 955, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a bowl in the image?"}]}, {"id": 956, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a cup in the image?"}]}, {"id": 957, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a person in the image?"}]}, {"id": 958, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a car in the image?"}]}, {"id": 959, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a laptop in the image?"}]}, {"id": 960, "image": "COCO_val2014_000000489728.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, laptop, orange, bed, tv, couch, book. Based on this, is there a dining table in the image?"}]}, {"id": 961, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there a person in the image?"}]}, {"id": 962, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there a car in the image?"}]}, {"id": 963, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there a sports ball in the image?"}]}, {"id": 964, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there a tennis racket in the image?"}]}, {"id": 965, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 966, "image": "COCO_val2014_000000419453.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 967, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a teddy bear in the image?"}]}, {"id": 968, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a bear in the image?"}]}, {"id": 969, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a person in the image?"}]}, {"id": 970, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a car in the image?"}]}, {"id": 971, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a bed in the image?"}]}, {"id": 972, "image": "COCO_val2014_000000358255.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains teddy bear, person, bed, book. Based on this, is there a dining table in the image?"}]}, {"id": 973, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 974, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a person in the image?"}]}, {"id": 975, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a car in the image?"}]}, {"id": 976, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a truck in the image?"}]}, {"id": 977, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a bicycle in the image?"}]}, {"id": 978, "image": "COCO_val2014_000000178078.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, car, bicycle. Based on this, is there a bus in the image?"}]}, {"id": 979, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a person in the image?"}]}, {"id": 980, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a car in the image?"}]}, {"id": 981, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a handbag in the image?"}]}, {"id": 982, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a backpack in the image?"}]}, {"id": 983, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a dining table in the image?"}]}, {"id": 984, "image": "COCO_val2014_000000197219.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table, chair, pizza. Based on this, is there a cup in the image?"}]}, {"id": 985, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a donut in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a donut in the image?"}]}, {"id": 986, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a spoon in the image?"}]}, {"id": 987, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a cake in the image?"}]}, {"id": 988, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a cup in the image?"}]}, {"id": 989, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a person in the image?"}]}, {"id": 990, "image": "COCO_val2014_000000460931.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains donut, cake, person. Based on this, is there a car in the image?"}]}, {"id": 991, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a backpack in the image?"}]}, {"id": 992, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a handbag in the image?"}]}, {"id": 993, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a person in the image?"}]}, {"id": 994, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a dining table in the image?"}]}, {"id": 995, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a car in the image?"}]}, {"id": 996, "image": "COCO_val2014_000000506483.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, car, bench, cat. Based on this, is there a truck in the image?"}]}, {"id": 997, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a banana in the image?"}]}, {"id": 998, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 999, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a person in the image?"}]}, {"id": 1000, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a car in the image?"}]}, {"id": 1001, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a fork in the image?"}]}, {"id": 1002, "image": "COCO_val2014_000000468934.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, person, fork, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1003, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a sink in the image?"}]}, {"id": 1004, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a toilet in the image?"}]}, {"id": 1005, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a person in the image?"}]}, {"id": 1006, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a car in the image?"}]}, {"id": 1007, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a bottle in the image?"}]}, {"id": 1008, "image": "COCO_val2014_000000189694.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sink, person, bottle, microwave. Based on this, is there a dining table in the image?"}]}, {"id": 1009, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there a person in the image?"}]}, {"id": 1010, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there a dining table in the image?"}]}, {"id": 1011, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there an orange in the image?"}]}, {"id": 1012, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there a bowl in the image?"}]}, {"id": 1013, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there a car in the image?"}]}, {"id": 1014, "image": "COCO_val2014_000000273450.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, orange, car, parking meter. Based on this, is there a truck in the image?"}]}, {"id": 1015, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a person in the image?"}]}, {"id": 1016, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a car in the image?"}]}, {"id": 1017, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a couch in the image?"}]}, {"id": 1018, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a chair in the image?"}]}, {"id": 1019, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a laptop in the image?"}]}, {"id": 1020, "image": "COCO_val2014_000000278226.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, couch, laptop, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1021, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a backpack in the image?"}]}, {"id": 1022, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a skis in the image?"}]}, {"id": 1023, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a person in the image?"}]}, {"id": 1024, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a car in the image?"}]}, {"id": 1025, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a handbag in the image?"}]}, {"id": 1026, "image": "COCO_val2014_000000449432.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, train, boat, suitcase, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1027, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1028, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there an oven in the image?"}]}, {"id": 1029, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1030, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there a banana in the image?"}]}, {"id": 1031, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there a person in the image?"}]}, {"id": 1032, "image": "COCO_val2014_000000153300.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains spoon, bowl, person, dining table, knife, cake, fork, bottle, cup. Based on this, is there a car in the image?"}]}, {"id": 1033, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a person in the image?"}]}, {"id": 1034, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a car in the image?"}]}, {"id": 1035, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a bed in the image?"}]}, {"id": 1036, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a book in the image?"}]}, {"id": 1037, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a remote in the image?"}]}, {"id": 1038, "image": "COCO_val2014_000000506178.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, bed, remote. Based on this, is there a tv in the image?"}]}, {"id": 1039, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a backpack in the image?"}]}, {"id": 1040, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a handbag in the image?"}]}, {"id": 1041, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a person in the image?"}]}, {"id": 1042, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a dining table in the image?"}]}, {"id": 1043, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a traffic light in the image?"}]}, {"id": 1044, "image": "COCO_val2014_000000249720.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, traffic light, bicycle, car, stop sign, bench. Based on this, is there a bus in the image?"}]}, {"id": 1045, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1046, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a person in the image?"}]}, {"id": 1047, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a train in the image?"}]}, {"id": 1048, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 1049, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a car in the image?"}]}, {"id": 1050, "image": "COCO_val2014_000000205206.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, train, car, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 1051, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a backpack in the image?"}]}, {"id": 1052, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a handbag in the image?"}]}, {"id": 1053, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a person in the image?"}]}, {"id": 1054, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a car in the image?"}]}, {"id": 1055, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a couch in the image?"}]}, {"id": 1056, "image": "COCO_val2014_000000018150.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, couch, bottle, pizza. Based on this, is there a chair in the image?"}]}, {"id": 1057, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a tv in the image?"}]}, {"id": 1058, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a person in the image?"}]}, {"id": 1059, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a backpack in the image?"}]}, {"id": 1060, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a handbag in the image?"}]}, {"id": 1061, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a chair in the image?"}]}, {"id": 1062, "image": "COCO_val2014_000000303534.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, chair, bed, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1063, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1064, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1065, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 1066, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 1067, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a bottle in the image?"}]}, {"id": 1068, "image": "COCO_val2014_000000278771.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, bottle, bench, baseball bat. Based on this, is there a dining table in the image?"}]}, {"id": 1069, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1070, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1071, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a person in the image?"}]}, {"id": 1072, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a car in the image?"}]}, {"id": 1073, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1074, "image": "COCO_val2014_000000134075.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains spoon, person, bottle, dining table, cell phone, cup. Based on this, is there a chair in the image?"}]}, {"id": 1075, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there a banana in the image?"}]}, {"id": 1076, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there an orange in the image?"}]}, {"id": 1077, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there a person in the image?"}]}, {"id": 1078, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there a car in the image?"}]}, {"id": 1079, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1080, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup. Based on this, is there an oven in the image?"}]}, {"id": 1081, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 1082, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 1083, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 1084, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 1085, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 1086, "image": "COCO_val2014_000000124629.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 1087, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a person in the image?"}]}, {"id": 1088, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a car in the image?"}]}, {"id": 1089, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a motorcycle in the image?"}]}, {"id": 1090, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 1091, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a bus in the image?"}]}, {"id": 1092, "image": "COCO_val2014_000000142774.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1093, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 1094, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a skis in the image?"}]}, {"id": 1095, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a person in the image?"}]}, {"id": 1096, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a car in the image?"}]}, {"id": 1097, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a train in the image?"}]}, {"id": 1098, "image": "COCO_val2014_000000199959.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, train, handbag. Based on this, is there a truck in the image?"}]}, {"id": 1099, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1100, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a person in the image?"}]}, {"id": 1101, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a broccoli in the image?"}]}, {"id": 1102, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a carrot in the image?"}]}, {"id": 1103, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1104, "image": "COCO_val2014_000000316700.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, orange, sandwich, fork, cup. Based on this, is there a chair in the image?"}]}, {"id": 1105, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1106, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1107, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 1108, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 1109, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a baseball bat in the image?"}]}, {"id": 1110, "image": "COCO_val2014_000000040361.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 1111, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a truck in the image?"}]}, {"id": 1112, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a car in the image?"}]}, {"id": 1113, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a bowl in the image?"}]}, {"id": 1114, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a cup in the image?"}]}, {"id": 1115, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a person in the image?"}]}, {"id": 1116, "image": "COCO_val2014_000000378873.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains truck, bowl, person, handbag, dining table, orange, carrot. Based on this, is there a chair in the image?"}]}, {"id": 1117, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a traffic light in the image?"}]}, {"id": 1118, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a person in the image?"}]}, {"id": 1119, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a truck in the image?"}]}, {"id": 1120, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a motorcycle in the image?"}]}, {"id": 1121, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a car in the image?"}]}, {"id": 1122, "image": "COCO_val2014_000000574790.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, car. Based on this, is there a bus in the image?"}]}, {"id": 1123, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1124, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1125, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1126, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a person in the image?"}]}, {"id": 1127, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 1128, "image": "COCO_val2014_000000011241.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, spoon, sandwich, bottle, knife, donut, cup. Based on this, is there a fork in the image?"}]}, {"id": 1129, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a person in the image?"}]}, {"id": 1130, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a car in the image?"}]}, {"id": 1131, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a bicycle in the image?"}]}, {"id": 1132, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a motorcycle in the image?"}]}, {"id": 1133, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1134, "image": "COCO_val2014_000000525667.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, dining table, bench, cup. Based on this, is there a chair in the image?"}]}, {"id": 1135, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1136, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a person in the image?"}]}, {"id": 1137, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a clock in the image?"}]}, {"id": 1138, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a car in the image?"}]}, {"id": 1139, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1140, "image": "COCO_val2014_000000246145.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains chair, clock, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1141, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 1142, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 1143, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1144, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 1145, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1146, "image": "COCO_val2014_000000313162.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1147, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1148, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a car in the image?"}]}, {"id": 1149, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 1150, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 1151, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a cell phone in the image?"}]}, {"id": 1152, "image": "COCO_val2014_000000529668.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 1153, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1154, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a couch in the image?"}]}, {"id": 1155, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a person in the image?"}]}, {"id": 1156, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a car in the image?"}]}, {"id": 1157, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a cell phone in the image?"}]}, {"id": 1158, "image": "COCO_val2014_000000376959.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains chair, person, cell phone, dining table. Based on this, is there a handbag in the image?"}]}, {"id": 1159, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a chair in the image?"}]}, {"id": 1160, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a dining table in the image?"}]}, {"id": 1161, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1162, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1163, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a bench in the image?"}]}, {"id": 1164, "image": "COCO_val2014_000000275863.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains chair, person, bench, baseball bat. Based on this, is there a backpack in the image?"}]}, {"id": 1165, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a person in the image?"}]}, {"id": 1166, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a car in the image?"}]}, {"id": 1167, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a spoon in the image?"}]}, {"id": 1168, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a cup in the image?"}]}, {"id": 1169, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a bowl in the image?"}]}, {"id": 1170, "image": "COCO_val2014_000000327038.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, fork, bottle, knife. Based on this, is there a dining table in the image?"}]}, {"id": 1171, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 1172, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 1173, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1174, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 1175, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1176, "image": "COCO_val2014_000000513136.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1177, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a truck in the image?"}]}, {"id": 1178, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a car in the image?"}]}, {"id": 1179, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a bed in the image?"}]}, {"id": 1180, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a book in the image?"}]}, {"id": 1181, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a person in the image?"}]}, {"id": 1182, "image": "COCO_val2014_000000184338.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, bed, person. Based on this, is there a dining table in the image?"}]}, {"id": 1183, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a person in the image?"}]}, {"id": 1184, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a car in the image?"}]}, {"id": 1185, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a dining table in the image?"}]}, {"id": 1186, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a cup in the image?"}]}, {"id": 1187, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a donut in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a donut in the image?"}]}, {"id": 1188, "image": "COCO_val2014_000000175437.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, donut. Based on this, is there a spoon in the image?"}]}, {"id": 1189, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a vase in the image?"}]}, {"id": 1190, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 1191, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a person in the image?"}]}, {"id": 1192, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a car in the image?"}]}, {"id": 1193, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1194, "image": "COCO_val2014_000000498100.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, person, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1195, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a refrigerator in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a refrigerator in the image?"}]}, {"id": 1196, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a bottle in the image?"}]}, {"id": 1197, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a couch in the image?"}]}, {"id": 1198, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a person in the image?"}]}, {"id": 1199, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a bed in the image?"}]}, {"id": 1200, "image": "COCO_val2014_000000375909.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains refrigerator, couch, bed. Based on this, is there a book in the image?"}]}, {"id": 1201, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a backpack in the image?"}]}, {"id": 1202, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a skis in the image?"}]}, {"id": 1203, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a truck in the image?"}]}, {"id": 1204, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a traffic light in the image?"}]}, {"id": 1205, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 1206, "image": "COCO_val2014_000000396338.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, car, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 1207, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a person in the image?"}]}, {"id": 1208, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a car in the image?"}]}, {"id": 1209, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1210, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1211, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1212, "image": "COCO_val2014_000000124930.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, spoon, wine glass, knife, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1213, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a person in the image?"}]}, {"id": 1214, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a car in the image?"}]}, {"id": 1215, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a handbag in the image?"}]}, {"id": 1216, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a backpack in the image?"}]}, {"id": 1217, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a suitcase in the image?"}]}, {"id": 1218, "image": "COCO_val2014_000000112664.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, suitcase, bench, tie. Based on this, is there a bottle in the image?"}]}, {"id": 1219, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a truck in the image?"}]}, {"id": 1220, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a person in the image?"}]}, {"id": 1221, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a train in the image?"}]}, {"id": 1222, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a car in the image?"}]}, {"id": 1223, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a bed in the image?"}]}, {"id": 1224, "image": "COCO_val2014_000000377879.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains truck, train, bed. Based on this, is there a book in the image?"}]}, {"id": 1225, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a truck in the image?"}]}, {"id": 1226, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a person in the image?"}]}, {"id": 1227, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a clock in the image?"}]}, {"id": 1228, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a chair in the image?"}]}, {"id": 1229, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a car in the image?"}]}, {"id": 1230, "image": "COCO_val2014_000000377401.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, car. Based on this, is there a bus in the image?"}]}, {"id": 1231, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a vase in the image?"}]}, {"id": 1232, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 1233, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a book in the image?"}]}, {"id": 1234, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a person in the image?"}]}, {"id": 1235, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1236, "image": "COCO_val2014_000000049473.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, book, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1237, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there a person in the image?"}]}, {"id": 1238, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there a dining table in the image?"}]}, {"id": 1239, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there a car in the image?"}]}, {"id": 1240, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there a truck in the image?"}]}, {"id": 1241, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there a kite in the image?"}]}, {"id": 1242, "image": "COCO_val2014_000000153865.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, car, kite. Based on this, is there an umbrella in the image?"}]}, {"id": 1243, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a banana in the image?"}]}, {"id": 1244, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1245, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1246, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a person in the image?"}]}, {"id": 1247, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1248, "image": "COCO_val2014_000000383185.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, bottle, cup. Based on this, is there a knife in the image?"}]}, {"id": 1249, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a person in the image?"}]}, {"id": 1250, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a car in the image?"}]}, {"id": 1251, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1252, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1253, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 1254, "image": "COCO_val2014_000000388983.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, sandwich, hot dog, dining table, cup. Based on this, is there a fork in the image?"}]}, {"id": 1255, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 1256, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 1257, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1258, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1259, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1260, "image": "COCO_val2014_000000295377.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1261, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a chair in the image?"}]}, {"id": 1262, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a person in the image?"}]}, {"id": 1263, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a dog in the image?"}]}, {"id": 1264, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a car in the image?"}]}, {"id": 1265, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a couch in the image?"}]}, {"id": 1266, "image": "COCO_val2014_000000034773.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, couch, potted plant. Based on this, is there a tv in the image?"}]}, {"id": 1267, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a truck in the image?"}]}, {"id": 1268, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a traffic light in the image?"}]}, {"id": 1269, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 1270, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 1271, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a bicycle in the image?"}]}, {"id": 1272, "image": "COCO_val2014_000000244455.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, motorcycle. Based on this, is there a bus in the image?"}]}, {"id": 1273, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1274, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1275, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1276, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a person in the image?"}]}, {"id": 1277, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a knife in the image?"}]}, {"id": 1278, "image": "COCO_val2014_000000303652.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, cake, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1279, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a truck in the image?"}]}, {"id": 1280, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a traffic light in the image?"}]}, {"id": 1281, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a clock in the image?"}]}, {"id": 1282, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a dining table in the image?"}]}, {"id": 1283, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a person in the image?"}]}, {"id": 1284, "image": "COCO_val2014_000000098493.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, car, chair. Based on this, is there a handbag in the image?"}]}, {"id": 1285, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a traffic light in the image?"}]}, {"id": 1286, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a car in the image?"}]}, {"id": 1287, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a person in the image?"}]}, {"id": 1288, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a dining table in the image?"}]}, {"id": 1289, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a train in the image?"}]}, {"id": 1290, "image": "COCO_val2014_000000201148.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, train. Based on this, is there a truck in the image?"}]}, {"id": 1291, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 1292, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there a person in the image?"}]}, {"id": 1293, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 1294, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1295, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there an oven in the image?"}]}, {"id": 1296, "image": "COCO_val2014_000000307166.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains pizza, bottle, oven, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 1297, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a clock in the image?"}]}, {"id": 1298, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a chair in the image?"}]}, {"id": 1299, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a person in the image?"}]}, {"id": 1300, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a car in the image?"}]}, {"id": 1301, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1302, "image": "COCO_val2014_000000313034.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, person, bottle, fork, vase, cake, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1303, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1304, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a car in the image?"}]}, {"id": 1305, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there an orange in the image?"}]}, {"id": 1306, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 1307, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 1308, "image": "COCO_val2014_000000355342.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1309, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1310, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a person in the image?"}]}, {"id": 1311, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a bed in the image?"}]}, {"id": 1312, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a book in the image?"}]}, {"id": 1313, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1314, "image": "COCO_val2014_000000333237.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains chair, bed, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1315, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a laptop in the image?"}]}, {"id": 1316, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a tv in the image?"}]}, {"id": 1317, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a dining table in the image?"}]}, {"id": 1318, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a person in the image?"}]}, {"id": 1319, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a chair in the image?"}]}, {"id": 1320, "image": "COCO_val2014_000000526368.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains laptop, dining table, chair, keyboard, book. Based on this, is there a couch in the image?"}]}, {"id": 1321, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a chair in the image?"}]}, {"id": 1322, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a dining table in the image?"}]}, {"id": 1323, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a person in the image?"}]}, {"id": 1324, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a car in the image?"}]}, {"id": 1325, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a laptop in the image?"}]}, {"id": 1326, "image": "COCO_val2014_000000429033.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop. Based on this, is there a tv in the image?"}]}, {"id": 1327, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a tv in the image?"}]}, {"id": 1328, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1329, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a mouse in the image?"}]}, {"id": 1330, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a book in the image?"}]}, {"id": 1331, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a laptop in the image?"}]}, {"id": 1332, "image": "COCO_val2014_000000287035.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a bottle in the image?"}]}, {"id": 1333, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a person in the image?"}]}, {"id": 1334, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a car in the image?"}]}, {"id": 1335, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a cell phone in the image?"}]}, {"id": 1336, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1337, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a bus in the image?"}]}, {"id": 1338, "image": "COCO_val2014_000000299074.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, cell phone, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1339, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a handbag in the image?"}]}, {"id": 1340, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a person in the image?"}]}, {"id": 1341, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a dining table in the image?"}]}, {"id": 1342, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a cup in the image?"}]}, {"id": 1343, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a suitcase in the image?"}]}, {"id": 1344, "image": "COCO_val2014_000000120648.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains handbag, dining table, suitcase, bed, book. Based on this, is there a backpack in the image?"}]}, {"id": 1345, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there a car in the image?"}]}, {"id": 1346, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there a person in the image?"}]}, {"id": 1347, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there a truck in the image?"}]}, {"id": 1348, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there a traffic light in the image?"}]}, {"id": 1349, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there an orange in the image?"}]}, {"id": 1350, "image": "COCO_val2014_000000186709.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, truck, orange, apple. Based on this, is there a dining table in the image?"}]}, {"id": 1351, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a truck in the image?"}]}, {"id": 1352, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a person in the image?"}]}, {"id": 1353, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a couch in the image?"}]}, {"id": 1354, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a tv in the image?"}]}, {"id": 1355, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a car in the image?"}]}, {"id": 1356, "image": "COCO_val2014_000000025972.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, couch, car, bottle, bicycle, stop sign, chair. Based on this, is there a bus in the image?"}]}, {"id": 1357, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a person in the image?"}]}, {"id": 1358, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a dining table in the image?"}]}, {"id": 1359, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a train in the image?"}]}, {"id": 1360, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a truck in the image?"}]}, {"id": 1361, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a car in the image?"}]}, {"id": 1362, "image": "COCO_val2014_000000505542.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a bus in the image?"}]}, {"id": 1363, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a person in the image?"}]}, {"id": 1364, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a car in the image?"}]}, {"id": 1365, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a horse in the image?"}]}, {"id": 1366, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a dog in the image?"}]}, {"id": 1367, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a cow in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a cow in the image?"}]}, {"id": 1368, "image": "COCO_val2014_000000115636.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, horse, cow. Based on this, is there a bicycle in the image?"}]}, {"id": 1369, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a broccoli in the image?"}]}, {"id": 1370, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a bowl in the image?"}]}, {"id": 1371, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a fork in the image?"}]}, {"id": 1372, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a person in the image?"}]}, {"id": 1373, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a laptop in the image?"}]}, {"id": 1374, "image": "COCO_val2014_000000280810.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains broccoli, fork, laptop, dining table, carrot. Based on this, is there a tv in the image?"}]}, {"id": 1375, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 1376, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1377, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 1378, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 1379, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a knife in the image?"}]}, {"id": 1380, "image": "COCO_val2014_000000037900.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains backpack, handbag, knife, book, cell phone. Based on this, is there a cup in the image?"}]}, {"id": 1381, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a traffic light in the image?"}]}, {"id": 1382, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a car in the image?"}]}, {"id": 1383, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a person in the image?"}]}, {"id": 1384, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a dining table in the image?"}]}, {"id": 1385, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a tie in the image?"}]}, {"id": 1386, "image": "COCO_val2014_000000534516.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, tie. Based on this, is there a cup in the image?"}]}, {"id": 1387, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a bowl in the image?"}]}, {"id": 1388, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a cup in the image?"}]}, {"id": 1389, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a dining table in the image?"}]}, {"id": 1390, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a person in the image?"}]}, {"id": 1391, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a chair in the image?"}]}, {"id": 1392, "image": "COCO_val2014_000000123017.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bowl, dining table, chair, vase, bench. Based on this, is there a couch in the image?"}]}, {"id": 1393, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1394, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a car in the image?"}]}, {"id": 1395, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 1396, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 1397, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a cell phone in the image?"}]}, {"id": 1398, "image": "COCO_val2014_000000316237.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 1399, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a backpack in the image?"}]}, {"id": 1400, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a handbag in the image?"}]}, {"id": 1401, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a person in the image?"}]}, {"id": 1402, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a car in the image?"}]}, {"id": 1403, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a dog in the image?"}]}, {"id": 1404, "image": "COCO_val2014_000000463522.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, dog, horse, bicycle. Based on this, is there a truck in the image?"}]}, {"id": 1405, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 1406, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a skis in the image?"}]}, {"id": 1407, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1408, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 1409, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1410, "image": "COCO_val2014_000000511341.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, car, umbrella. Based on this, is there a chair in the image?"}]}, {"id": 1411, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a bottle in the image?"}]}, {"id": 1412, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a person in the image?"}]}, {"id": 1413, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a boat in the image?"}]}, {"id": 1414, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a car in the image?"}]}, {"id": 1415, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a bench in the image?"}]}, {"id": 1416, "image": "COCO_val2014_000000200583.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains bottle, boat, bench, dining table, suitcase. Based on this, is there a backpack in the image?"}]}, {"id": 1417, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a truck in the image?"}]}, {"id": 1418, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a traffic light in the image?"}]}, {"id": 1419, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a car in the image?"}]}, {"id": 1420, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a bus in the image?"}]}, {"id": 1421, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a person in the image?"}]}, {"id": 1422, "image": "COCO_val2014_000000424585.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a dining table in the image?"}]}, {"id": 1423, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a clock in the image?"}]}, {"id": 1424, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a person in the image?"}]}, {"id": 1425, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a bed in the image?"}]}, {"id": 1426, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a book in the image?"}]}, {"id": 1427, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a bottle in the image?"}]}, {"id": 1428, "image": "COCO_val2014_000000100215.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, bed, bottle, teddy bear. Based on this, is there a dining table in the image?"}]}, {"id": 1429, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a tv in the image?"}]}, {"id": 1430, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a dining table in the image?"}]}, {"id": 1431, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a sink in the image?"}]}, {"id": 1432, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a bottle in the image?"}]}, {"id": 1433, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a person in the image?"}]}, {"id": 1434, "image": "COCO_val2014_000000017379.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, sink, person. Based on this, is there a car in the image?"}]}, {"id": 1435, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1436, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1437, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a scissors in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a scissors in the image?"}]}, {"id": 1438, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1439, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a person in the image?"}]}, {"id": 1440, "image": "COCO_val2014_000000511622.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bowl, scissors, person, spoon, cup. Based on this, is there a car in the image?"}]}, {"id": 1441, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a tv in the image?"}]}, {"id": 1442, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a person in the image?"}]}, {"id": 1443, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a laptop in the image?"}]}, {"id": 1444, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a mouse in the image?"}]}, {"id": 1445, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a dining table in the image?"}]}, {"id": 1446, "image": "COCO_val2014_000000407386.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains tv, laptop, dining table, keyboard, cat. Based on this, is there a cup in the image?"}]}, {"id": 1447, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there a spoon in the image?"}]}, {"id": 1448, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there a cup in the image?"}]}, {"id": 1449, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there an orange in the image?"}]}, {"id": 1450, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there a person in the image?"}]}, {"id": 1451, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there a cake in the image?"}]}, {"id": 1452, "image": "COCO_val2014_000000039516.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, orange, cake. Based on this, is there a dining table in the image?"}]}, {"id": 1453, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there a sink in the image?"}]}, {"id": 1454, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there a bottle in the image?"}]}, {"id": 1455, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there a bowl in the image?"}]}, {"id": 1456, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there a cup in the image?"}]}, {"id": 1457, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there an oven in the image?"}]}, {"id": 1458, "image": "COCO_val2014_000000018918.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, bowl, oven. Based on this, is there a person in the image?"}]}, {"id": 1459, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a person in the image?"}]}, {"id": 1460, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a car in the image?"}]}, {"id": 1461, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a motorcycle in the image?"}]}, {"id": 1462, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a bicycle in the image?"}]}, {"id": 1463, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a parking meter in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a parking meter in the image?"}]}, {"id": 1464, "image": "COCO_val2014_000000115626.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, parking meter. Based on this, is there a truck in the image?"}]}, {"id": 1465, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a traffic light in the image?"}]}, {"id": 1466, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a car in the image?"}]}, {"id": 1467, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a toothbrush in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a toothbrush in the image?"}]}, {"id": 1468, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a sink in the image?"}]}, {"id": 1469, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a person in the image?"}]}, {"id": 1470, "image": "COCO_val2014_000000391735.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, toothbrush, person. Based on this, is there a dining table in the image?"}]}, {"id": 1471, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a chair in the image?"}]}, {"id": 1472, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a dining table in the image?"}]}, {"id": 1473, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a person in the image?"}]}, {"id": 1474, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a car in the image?"}]}, {"id": 1475, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a book in the image?"}]}, {"id": 1476, "image": "COCO_val2014_000000236370.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, book, tie. Based on this, is there a tv in the image?"}]}, {"id": 1477, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a snowboard in the image?"}]}, {"id": 1478, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a backpack in the image?"}]}, {"id": 1479, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a skis in the image?"}]}, {"id": 1480, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a dog in the image?"}]}, {"id": 1481, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a person in the image?"}]}, {"id": 1482, "image": "COCO_val2014_000000463542.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, skis, person. Based on this, is there a car in the image?"}]}, {"id": 1483, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a person in the image?"}]}, {"id": 1484, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a dining table in the image?"}]}, {"id": 1485, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 1486, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a truck in the image?"}]}, {"id": 1487, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a car in the image?"}]}, {"id": 1488, "image": "COCO_val2014_000000377352.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car, bicycle. Based on this, is there a bus in the image?"}]}, {"id": 1489, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a snowboard in the image?"}]}, {"id": 1490, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a skis in the image?"}]}, {"id": 1491, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a backpack in the image?"}]}, {"id": 1492, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a handbag in the image?"}]}, {"id": 1493, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a person in the image?"}]}, {"id": 1494, "image": "COCO_val2014_000000302405.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person. Based on this, is there a car in the image?"}]}, {"id": 1495, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball glove in the image?"}]}, {"id": 1496, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball bat in the image?"}]}, {"id": 1497, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a person in the image?"}]}, {"id": 1498, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a car in the image?"}]}, {"id": 1499, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a sports ball in the image?"}]}, {"id": 1500, "image": "COCO_val2014_000000554328.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a tennis racket in the image?"}]}, {"id": 1501, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1502, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1503, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1504, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a person in the image?"}]}, {"id": 1505, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a knife in the image?"}]}, {"id": 1506, "image": "COCO_val2014_000000384040.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, knife, donut, sandwich, bottle, fork, cup. Based on this, is there a cake in the image?"}]}, {"id": 1507, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a clock in the image?"}]}, {"id": 1508, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a person in the image?"}]}, {"id": 1509, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a dining table in the image?"}]}, {"id": 1510, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a cup in the image?"}]}, {"id": 1511, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a chair in the image?"}]}, {"id": 1512, "image": "COCO_val2014_000000023731.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains clock, dining table, chair, orange, cat. Based on this, is there a couch in the image?"}]}, {"id": 1513, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a person in the image?"}]}, {"id": 1514, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a car in the image?"}]}, {"id": 1515, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a wine glass in the image?"}]}, {"id": 1516, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a cup in the image?"}]}, {"id": 1517, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a dining table in the image?"}]}, {"id": 1518, "image": "COCO_val2014_000000463640.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, knife, cake, tie. Based on this, is there a chair in the image?"}]}, {"id": 1519, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a potted plant in the image?"}]}, {"id": 1520, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a person in the image?"}]}, {"id": 1521, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a bottle in the image?"}]}, {"id": 1522, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a dining table in the image?"}]}, {"id": 1523, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a chair in the image?"}]}, {"id": 1524, "image": "COCO_val2014_000000365822.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, chair, vase, oven. Based on this, is there a couch in the image?"}]}, {"id": 1525, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a baseball glove in the image?"}]}, {"id": 1526, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a baseball bat in the image?"}]}, {"id": 1527, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a person in the image?"}]}, {"id": 1528, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a car in the image?"}]}, {"id": 1529, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a sports ball in the image?"}]}, {"id": 1530, "image": "COCO_val2014_000000524979.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, dog. Based on this, is there a tennis racket in the image?"}]}, {"id": 1531, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a handbag in the image?"}]}, {"id": 1532, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a person in the image?"}]}, {"id": 1533, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a bed in the image?"}]}, {"id": 1534, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a book in the image?"}]}, {"id": 1535, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 1536, "image": "COCO_val2014_000000070813.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains handbag, bed, bottle, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1537, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a sandwich in the image?"}]}, {"id": 1538, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a cup in the image?"}]}, {"id": 1539, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a fork in the image?"}]}, {"id": 1540, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a person in the image?"}]}, {"id": 1541, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a dining table in the image?"}]}, {"id": 1542, "image": "COCO_val2014_000000318209.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, refrigerator, cat. Based on this, is there a chair in the image?"}]}, {"id": 1543, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a bird in the image?"}]}, {"id": 1544, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a car in the image?"}]}, {"id": 1545, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a truck in the image?"}]}, {"id": 1546, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a traffic light in the image?"}]}, {"id": 1547, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a person in the image?"}]}, {"id": 1548, "image": "COCO_val2014_000000016775.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, person, dog, handbag. Based on this, is there a dining table in the image?"}]}, {"id": 1549, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 1550, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1551, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a person in the image?"}]}, {"id": 1552, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1553, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a sports ball in the image?"}]}, {"id": 1554, "image": "COCO_val2014_000000015338.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains truck, person, sports ball, car, bus. Based on this, is there a tennis racket in the image?"}]}, {"id": 1555, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 1556, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there a skis in the image?"}]}, {"id": 1557, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there a person in the image?"}]}, {"id": 1558, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there a car in the image?"}]}, {"id": 1559, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there an elephant in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there an elephant in the image?"}]}, {"id": 1560, "image": "COCO_val2014_000000441156.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, elephant, handbag. Based on this, is there a dining table in the image?"}]}, {"id": 1561, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1562, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a car in the image?"}]}, {"id": 1563, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a kite in the image?"}]}, {"id": 1564, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a surfboard in the image?"}]}, {"id": 1565, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 1566, "image": "COCO_val2014_000000408757.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1567, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a person in the image?"}]}, {"id": 1568, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a dining table in the image?"}]}, {"id": 1569, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a car in the image?"}]}, {"id": 1570, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a truck in the image?"}]}, {"id": 1571, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a bus in the image?"}]}, {"id": 1572, "image": "COCO_val2014_000000550691.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, car, bus, tie. Based on this, is there a traffic light in the image?"}]}, {"id": 1573, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a banana in the image?"}]}, {"id": 1574, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a dining table in the image?"}]}, {"id": 1575, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a person in the image?"}]}, {"id": 1576, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a car in the image?"}]}, {"id": 1577, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a bowl in the image?"}]}, {"id": 1578, "image": "COCO_val2014_000000204100.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, person, bowl, bench. Based on this, is there a cup in the image?"}]}, {"id": 1579, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1580, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1581, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a bench in the image?"}]}, {"id": 1582, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a dining table in the image?"}]}, {"id": 1583, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 1584, "image": "COCO_val2014_000000468169.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, bench, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 1585, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a bowl in the image?"}]}, {"id": 1586, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a cup in the image?"}]}, {"id": 1587, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a couch in the image?"}]}, {"id": 1588, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a person in the image?"}]}, {"id": 1589, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a potted plant in the image?"}]}, {"id": 1590, "image": "COCO_val2014_000000198312.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains bowl, couch, potted plant, dining table, chair, vase. Based on this, is there a tv in the image?"}]}, {"id": 1591, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there a person in the image?"}]}, {"id": 1592, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there a dining table in the image?"}]}, {"id": 1593, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there a car in the image?"}]}, {"id": 1594, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there a truck in the image?"}]}, {"id": 1595, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there an elephant in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there an elephant in the image?"}]}, {"id": 1596, "image": "COCO_val2014_000000485485.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, car, elephant. Based on this, is there a chair in the image?"}]}, {"id": 1597, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a backpack in the image?"}]}, {"id": 1598, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a handbag in the image?"}]}, {"id": 1599, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a person in the image?"}]}, {"id": 1600, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a car in the image?"}]}, {"id": 1601, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a bench in the image?"}]}, {"id": 1602, "image": "COCO_val2014_000000309371.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1603, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a bird in the image?"}]}, {"id": 1604, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a boat in the image?"}]}, {"id": 1605, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a person in the image?"}]}, {"id": 1606, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a cup in the image?"}]}, {"id": 1607, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a dining table in the image?"}]}, {"id": 1608, "image": "COCO_val2014_000000472143.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bird, person, dining table, chair, bench, backpack, handbag, car, fork. Based on this, is there a bottle in the image?"}]}, {"id": 1609, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a person in the image?"}]}, {"id": 1610, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a car in the image?"}]}, {"id": 1611, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a clock in the image?"}]}, {"id": 1612, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a chair in the image?"}]}, {"id": 1613, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1614, "image": "COCO_val2014_000000236023.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, clock, bottle, knife, refrigerator, oven, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1615, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1616, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 1617, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1618, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1619, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1620, "image": "COCO_val2014_000000214244.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 1621, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a motorcycle in the image?"}]}, {"id": 1622, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a truck in the image?"}]}, {"id": 1623, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a person in the image?"}]}, {"id": 1624, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1625, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a handbag in the image?"}]}, {"id": 1626, "image": "COCO_val2014_000000397665.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains motorcycle, person, handbag, bicycle, car, orange, bus. Based on this, is there a backpack in the image?"}]}, {"id": 1627, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1628, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a person in the image?"}]}, {"id": 1629, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 1630, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a fork in the image?"}]}, {"id": 1631, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a hot dog in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a hot dog in the image?"}]}, {"id": 1632, "image": "COCO_val2014_000000183965.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, hot dog, dining table, donut, cup. Based on this, is there a chair in the image?"}]}, {"id": 1633, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 1634, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 1635, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 1636, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 1637, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 1638, "image": "COCO_val2014_000000499105.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 1639, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball glove in the image?"}]}, {"id": 1640, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a baseball bat in the image?"}]}, {"id": 1641, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a person in the image?"}]}, {"id": 1642, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a car in the image?"}]}, {"id": 1643, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a sports ball in the image?"}]}, {"id": 1644, "image": "COCO_val2014_000000259755.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball. Based on this, is there a tennis racket in the image?"}]}, {"id": 1645, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a chair in the image?"}]}, {"id": 1646, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a dining table in the image?"}]}, {"id": 1647, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a person in the image?"}]}, {"id": 1648, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a handbag in the image?"}]}, {"id": 1649, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a train in the image?"}]}, {"id": 1650, "image": "COCO_val2014_000000281028.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains chair, person, train, car. Based on this, is there a truck in the image?"}]}, {"id": 1651, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 1652, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 1653, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1654, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1655, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 1656, "image": "COCO_val2014_000000199122.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, chair, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 1657, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1658, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a person in the image?"}]}, {"id": 1659, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a cake in the image?"}]}, {"id": 1660, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1661, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a cup in the image?"}]}, {"id": 1662, "image": "COCO_val2014_000000442809.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bottle, cake, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1663, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 1664, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 1665, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 1666, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 1667, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 1668, "image": "COCO_val2014_000000482829.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 1669, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a clock in the image?"}]}, {"id": 1670, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a person in the image?"}]}, {"id": 1671, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a laptop in the image?"}]}, {"id": 1672, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a chair in the image?"}]}, {"id": 1673, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1674, "image": "COCO_val2014_000000097994.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains clock, laptop, dining table, tv, mouse, bottle, keyboard, book, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1675, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a tv in the image?"}]}, {"id": 1676, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a person in the image?"}]}, {"id": 1677, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a clock in the image?"}]}, {"id": 1678, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a dining table in the image?"}]}, {"id": 1679, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a couch in the image?"}]}, {"id": 1680, "image": "COCO_val2014_000000246999.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, couch, potted plant, remote, chair, vase. Based on this, is there a book in the image?"}]}, {"id": 1681, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a snowboard in the image?"}]}, {"id": 1682, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a skis in the image?"}]}, {"id": 1683, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a backpack in the image?"}]}, {"id": 1684, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a handbag in the image?"}]}, {"id": 1685, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a person in the image?"}]}, {"id": 1686, "image": "COCO_val2014_000000338291.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, bench. Based on this, is there a car in the image?"}]}, {"id": 1687, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 1688, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a traffic light in the image?"}]}, {"id": 1689, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1690, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 1691, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a bicycle in the image?"}]}, {"id": 1692, "image": "COCO_val2014_000000331366.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bicycle, car, umbrella. Based on this, is there a motorcycle in the image?"}]}, {"id": 1693, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1694, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 1695, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1696, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1697, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1698, "image": "COCO_val2014_000000348524.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 1699, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 1700, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1701, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a fork in the image?"}]}, {"id": 1702, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a person in the image?"}]}, {"id": 1703, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1704, "image": "COCO_val2014_000000108189.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains sandwich, fork, dining table, knife, cup. Based on this, is there a chair in the image?"}]}, {"id": 1705, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a tv in the image?"}]}, {"id": 1706, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a dining table in the image?"}]}, {"id": 1707, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a person in the image?"}]}, {"id": 1708, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a car in the image?"}]}, {"id": 1709, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a couch in the image?"}]}, {"id": 1710, "image": "COCO_val2014_000000301575.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch, potted plant, chair, cat, book. Based on this, is there a remote in the image?"}]}, {"id": 1711, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 1712, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 1713, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 1714, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 1715, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 1716, "image": "COCO_val2014_000000239773.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 1717, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1718, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a car in the image?"}]}, {"id": 1719, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a clock in the image?"}]}, {"id": 1720, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a couch in the image?"}]}, {"id": 1721, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a laptop in the image?"}]}, {"id": 1722, "image": "COCO_val2014_000000354976.jpg", "conversations": [{"from": "human", "value": "Is there a keyboard in the image?"}, {"from": "gpt", "value": "This image contains person, clock, laptop, dining table, chair, tv, mouse, cell phone. Based on this, is there a keyboard in the image?"}]}, {"id": 1723, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1724, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a car in the image?"}]}, {"id": 1725, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1726, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 1727, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a potted plant in the image?"}]}, {"id": 1728, "image": "COCO_val2014_000000473199.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, potted plant, dining table, chair, umbrella. Based on this, is there a vase in the image?"}]}, {"id": 1729, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a backpack in the image?"}]}, {"id": 1730, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a person in the image?"}]}, {"id": 1731, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a teddy bear in the image?"}]}, {"id": 1732, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a bed in the image?"}]}, {"id": 1733, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a bear in the image?"}]}, {"id": 1734, "image": "COCO_val2014_000000311759.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains backpack, teddy bear, bear. Based on this, is there a couch in the image?"}]}, {"id": 1735, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a dog in the image?"}]}, {"id": 1736, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a car in the image?"}]}, {"id": 1737, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a person in the image?"}]}, {"id": 1738, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a dining table in the image?"}]}, {"id": 1739, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a boat in the image?"}]}, {"id": 1740, "image": "COCO_val2014_000000431615.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains dog, person, boat. Based on this, is there a bird in the image?"}]}, {"id": 1741, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a car in the image?"}]}, {"id": 1742, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a truck in the image?"}]}, {"id": 1743, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a dog in the image?"}]}, {"id": 1744, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a frisbee in the image?"}]}, {"id": 1745, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a person in the image?"}]}, {"id": 1746, "image": "COCO_val2014_000000343401.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, dog, person, horse. Based on this, is there a dining table in the image?"}]}, {"id": 1747, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there a banana in the image?"}]}, {"id": 1748, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 1749, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there an orange in the image?"}]}, {"id": 1750, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there a person in the image?"}]}, {"id": 1751, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1752, "image": "COCO_val2014_000000246199.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, orange, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1753, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a bird in the image?"}]}, {"id": 1754, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a person in the image?"}]}, {"id": 1755, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a bed in the image?"}]}, {"id": 1756, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a book in the image?"}]}, {"id": 1757, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a teddy bear in the image?"}]}, {"id": 1758, "image": "COCO_val2014_000000372009.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains bird, bed, teddy bear. Based on this, is there a bear in the image?"}]}, {"id": 1759, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a banana in the image?"}]}, {"id": 1760, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a dining table in the image?"}]}, {"id": 1761, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a bowl in the image?"}]}, {"id": 1762, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a cup in the image?"}]}, {"id": 1763, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a person in the image?"}]}, {"id": 1764, "image": "COCO_val2014_000000346707.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, person. Based on this, is there a car in the image?"}]}, {"id": 1765, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a person in the image?"}]}, {"id": 1766, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a car in the image?"}]}, {"id": 1767, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a sports ball in the image?"}]}, {"id": 1768, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a baseball glove in the image?"}]}, {"id": 1769, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a tennis racket in the image?"}]}, {"id": 1770, "image": "COCO_val2014_000000501898.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, bench. Based on this, is there a chair in the image?"}]}, {"id": 1771, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a person in the image?"}]}, {"id": 1772, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a car in the image?"}]}, {"id": 1773, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a bicycle in the image?"}]}, {"id": 1774, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a motorcycle in the image?"}]}, {"id": 1775, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a handbag in the image?"}]}, {"id": 1776, "image": "COCO_val2014_000000281766.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 1777, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a truck in the image?"}]}, {"id": 1778, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a car in the image?"}]}, {"id": 1779, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 1780, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 1781, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 1782, "image": "COCO_val2014_000000245448.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, motorcycle. Based on this, is there a bicycle in the image?"}]}, {"id": 1783, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1784, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a car in the image?"}]}, {"id": 1785, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a wine glass in the image?"}]}, {"id": 1786, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a cup in the image?"}]}, {"id": 1787, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a couch in the image?"}]}, {"id": 1788, "image": "COCO_val2014_000000510138.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, couch, bottle, laptop, dining table, cell phone. Based on this, is there a chair in the image?"}]}, {"id": 1789, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a truck in the image?"}]}, {"id": 1790, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a person in the image?"}]}, {"id": 1791, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a train in the image?"}]}, {"id": 1792, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a traffic light in the image?"}]}, {"id": 1793, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a car in the image?"}]}, {"id": 1794, "image": "COCO_val2014_000000001171.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car, bed. Based on this, is there a bus in the image?"}]}, {"id": 1795, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a person in the image?"}]}, {"id": 1796, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a car in the image?"}]}, {"id": 1797, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a bottle in the image?"}]}, {"id": 1798, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a dining table in the image?"}]}, {"id": 1799, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a frisbee in the image?"}]}, {"id": 1800, "image": "COCO_val2014_000000100238.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, frisbee, handbag. Based on this, is there a dog in the image?"}]}, {"id": 1801, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1802, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a car in the image?"}]}, {"id": 1803, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a person in the image?"}]}, {"id": 1804, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1805, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a bus in the image?"}]}, {"id": 1806, "image": "COCO_val2014_000000465418.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bus. Based on this, is there a handbag in the image?"}]}, {"id": 1807, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a car in the image?"}]}, {"id": 1808, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a truck in the image?"}]}, {"id": 1809, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a traffic light in the image?"}]}, {"id": 1810, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a bus in the image?"}]}, {"id": 1811, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a person in the image?"}]}, {"id": 1812, "image": "COCO_val2014_000000392364.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, horse. Based on this, is there a dining table in the image?"}]}, {"id": 1813, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1814, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 1815, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1816, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1817, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1818, "image": "COCO_val2014_000000188958.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 1819, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a clock in the image?"}]}, {"id": 1820, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a chair in the image?"}]}, {"id": 1821, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a person in the image?"}]}, {"id": 1822, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1823, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a horse in the image?"}]}, {"id": 1824, "image": "COCO_val2014_000000436127.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains clock, person, horse, car, bus. Based on this, is there a dog in the image?"}]}, {"id": 1825, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 1826, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a dining table in the image?"}]}, {"id": 1827, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 1828, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 1829, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 1830, "image": "COCO_val2014_000000198397.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains chair, person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 1831, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there an oven in the image?"}]}, {"id": 1832, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1833, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1834, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there a person in the image?"}]}, {"id": 1835, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there a chair in the image?"}]}, {"id": 1836, "image": "COCO_val2014_000000349936.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains oven, dining table, chair, cake, tv, couch, book, cup. Based on this, is there a handbag in the image?"}]}, {"id": 1837, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 1838, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 1839, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 1840, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 1841, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 1842, "image": "COCO_val2014_000000333756.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 1843, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a backpack in the image?"}]}, {"id": 1844, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a skis in the image?"}]}, {"id": 1845, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a clock in the image?"}]}, {"id": 1846, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a chair in the image?"}]}, {"id": 1847, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a person in the image?"}]}, {"id": 1848, "image": "COCO_val2014_000000474741.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, clock, person, handbag, dining table, vase, tie. Based on this, is there a car in the image?"}]}, {"id": 1849, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a keyboard in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a keyboard in the image?"}]}, {"id": 1850, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a tv in the image?"}]}, {"id": 1851, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a mouse in the image?"}]}, {"id": 1852, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a chair in the image?"}]}, {"id": 1853, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a laptop in the image?"}]}, {"id": 1854, "image": "COCO_val2014_000000286342.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains keyboard, mouse, laptop, dining table. Based on this, is there a person in the image?"}]}, {"id": 1855, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a tv in the image?"}]}, {"id": 1856, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a person in the image?"}]}, {"id": 1857, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a mouse in the image?"}]}, {"id": 1858, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a chair in the image?"}]}, {"id": 1859, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a laptop in the image?"}]}, {"id": 1860, "image": "COCO_val2014_000000093948.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, keyboard, cat. Based on this, is there a cell phone in the image?"}]}, {"id": 1861, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a wine glass in the image?"}]}, {"id": 1862, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1863, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a person in the image?"}]}, {"id": 1864, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a car in the image?"}]}, {"id": 1865, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a laptop in the image?"}]}, {"id": 1866, "image": "COCO_val2014_000000405740.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, laptop, cup. Based on this, is there a tv in the image?"}]}, {"id": 1867, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a person in the image?"}]}, {"id": 1868, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a car in the image?"}]}, {"id": 1869, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a surfboard in the image?"}]}, {"id": 1870, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there an umbrella in the image?"}]}, {"id": 1871, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a kite in the image?"}]}, {"id": 1872, "image": "COCO_val2014_000000304387.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a bicycle in the image?"}]}, {"id": 1873, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a sink in the image?"}]}, {"id": 1874, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a bottle in the image?"}]}, {"id": 1875, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a person in the image?"}]}, {"id": 1876, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a car in the image?"}]}, {"id": 1877, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a spoon in the image?"}]}, {"id": 1878, "image": "COCO_val2014_000000147165.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains sink, person, spoon, oven. Based on this, is there a cup in the image?"}]}, {"id": 1879, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a truck in the image?"}]}, {"id": 1880, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a car in the image?"}]}, {"id": 1881, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a person in the image?"}]}, {"id": 1882, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a dining table in the image?"}]}, {"id": 1883, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there an airplane in the image?"}]}, {"id": 1884, "image": "COCO_val2014_000000495311.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a backpack in the image?"}]}, {"id": 1885, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a banana in the image?"}]}, {"id": 1886, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 1887, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 1888, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 1889, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1890, "image": "COCO_val2014_000000312406.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 1891, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a tv in the image?"}]}, {"id": 1892, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a dining table in the image?"}]}, {"id": 1893, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a clock in the image?"}]}, {"id": 1894, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a chair in the image?"}]}, {"id": 1895, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a person in the image?"}]}, {"id": 1896, "image": "COCO_val2014_000000515820.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, clock, person, train, bench. Based on this, is there a car in the image?"}]}, {"id": 1897, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there an orange in the image?"}]}, {"id": 1898, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there a person in the image?"}]}, {"id": 1899, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there a bed in the image?"}]}, {"id": 1900, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there a dining table in the image?"}]}, {"id": 1901, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there a book in the image?"}]}, {"id": 1902, "image": "COCO_val2014_000000031971.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains orange, bed, book. Based on this, is there a tv in the image?"}]}, {"id": 1903, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1904, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 1905, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1906, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1907, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1908, "image": "COCO_val2014_000000418680.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 1909, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1910, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a car in the image?"}]}, {"id": 1911, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there an orange in the image?"}]}, {"id": 1912, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 1913, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 1914, "image": "COCO_val2014_000000459680.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, orange, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1915, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1916, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1917, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a fork in the image?"}]}, {"id": 1918, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a person in the image?"}]}, {"id": 1919, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a cup in the image?"}]}, {"id": 1920, "image": "COCO_val2014_000000196462.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1921, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 1922, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a car in the image?"}]}, {"id": 1923, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a person in the image?"}]}, {"id": 1924, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a dining table in the image?"}]}, {"id": 1925, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 1926, "image": "COCO_val2014_000000276693.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains dog, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 1927, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a person in the image?"}]}, {"id": 1928, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a handbag in the image?"}]}, {"id": 1929, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a car in the image?"}]}, {"id": 1930, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a truck in the image?"}]}, {"id": 1931, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1932, "image": "COCO_val2014_000000356424.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, car, bottle, dining table, chair, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1933, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there a person in the image?"}]}, {"id": 1934, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there a car in the image?"}]}, {"id": 1935, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there a bottle in the image?"}]}, {"id": 1936, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there a dining table in the image?"}]}, {"id": 1937, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there an umbrella in the image?"}]}, {"id": 1938, "image": "COCO_val2014_000000505335.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, umbrella, tie. Based on this, is there a handbag in the image?"}]}, {"id": 1939, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a person in the image?"}]}, {"id": 1940, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a car in the image?"}]}, {"id": 1941, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1942, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a knife in the image?"}]}, {"id": 1943, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1944, "image": "COCO_val2014_000000172342.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, clock, dining table, bottle, fork, book, cup. Based on this, is there a banana in the image?"}]}, {"id": 1945, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a truck in the image?"}]}, {"id": 1946, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a traffic light in the image?"}]}, {"id": 1947, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a person in the image?"}]}, {"id": 1948, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 1949, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a car in the image?"}]}, {"id": 1950, "image": "COCO_val2014_000000384970.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, motorcycle, cell phone. Based on this, is there a bus in the image?"}]}, {"id": 1951, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there a wine glass in the image?"}]}, {"id": 1952, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there a person in the image?"}]}, {"id": 1953, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there a teddy bear in the image?"}]}, {"id": 1954, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there a bear in the image?"}]}, {"id": 1955, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there an apple in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there an apple in the image?"}]}, {"id": 1956, "image": "COCO_val2014_000000572260.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains wine glass, teddy bear, apple, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1957, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a person in the image?"}]}, {"id": 1958, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a car in the image?"}]}, {"id": 1959, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1960, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1961, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a chair in the image?"}]}, {"id": 1962, "image": "COCO_val2014_000000418471.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, chair, pizza, cup. Based on this, is there a couch in the image?"}]}, {"id": 1963, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a banana in the image?"}]}, {"id": 1964, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 1965, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a sandwich in the image?"}]}, {"id": 1966, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a cup in the image?"}]}, {"id": 1967, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 1968, "image": "COCO_val2014_000000379404.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, sandwich, dining table. Based on this, is there a person in the image?"}]}, {"id": 1969, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 1970, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a backpack in the image?"}]}, {"id": 1971, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a person in the image?"}]}, {"id": 1972, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a dining table in the image?"}]}, {"id": 1973, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a truck in the image?"}]}, {"id": 1974, "image": "COCO_val2014_000000044801.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, car, motorcycle, bus. Based on this, is there a handbag in the image?"}]}, {"id": 1975, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a person in the image?"}]}, {"id": 1976, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a car in the image?"}]}, {"id": 1977, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a surfboard in the image?"}]}, {"id": 1978, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a kite in the image?"}]}, {"id": 1979, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 1980, "image": "COCO_val2014_000000293564.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 1981, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a banana in the image?"}]}, {"id": 1982, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a dining table in the image?"}]}, {"id": 1983, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a spoon in the image?"}]}, {"id": 1984, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a bottle in the image?"}]}, {"id": 1985, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a bowl in the image?"}]}, {"id": 1986, "image": "COCO_val2014_000000452297.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, spoon, bowl, cup. Based on this, is there a person in the image?"}]}, {"id": 1987, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a fire hydrant in the image?"}]}, {"id": 1988, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a person in the image?"}]}, {"id": 1989, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a car in the image?"}]}, {"id": 1990, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a truck in the image?"}]}, {"id": 1991, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a stop sign in the image?"}]}, {"id": 1992, "image": "COCO_val2014_000000543393.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains fire hydrant, car, stop sign. Based on this, is there a traffic light in the image?"}]}, {"id": 1993, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a truck in the image?"}]}, {"id": 1994, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a traffic light in the image?"}]}, {"id": 1995, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a car in the image?"}]}, {"id": 1996, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a bus in the image?"}]}, {"id": 1997, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a person in the image?"}]}, {"id": 1998, "image": "COCO_val2014_000000172648.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, car, person, bed. Based on this, is there a dining table in the image?"}]}, {"id": 1999, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a traffic light in the image?"}]}, {"id": 2000, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a car in the image?"}]}, {"id": 2001, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a person in the image?"}]}, {"id": 2002, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a dining table in the image?"}]}, {"id": 2003, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a bicycle in the image?"}]}, {"id": 2004, "image": "COCO_val2014_000000308907.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, bicycle, potted plant. Based on this, is there a motorcycle in the image?"}]}, {"id": 2005, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a bird in the image?"}]}, {"id": 2006, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a person in the image?"}]}, {"id": 2007, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a truck in the image?"}]}, {"id": 2008, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a traffic light in the image?"}]}, {"id": 2009, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a car in the image?"}]}, {"id": 2010, "image": "COCO_val2014_000000263594.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains bird, truck, car. Based on this, is there a bus in the image?"}]}, {"id": 2011, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a tv in the image?"}]}, {"id": 2012, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a dining table in the image?"}]}, {"id": 2013, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a person in the image?"}]}, {"id": 2014, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a car in the image?"}]}, {"id": 2015, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a couch in the image?"}]}, {"id": 2016, "image": "COCO_val2014_000000501294.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, person, couch. Based on this, is there a chair in the image?"}]}, {"id": 2017, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a person in the image?"}]}, {"id": 2018, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a car in the image?"}]}, {"id": 2019, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a handbag in the image?"}]}, {"id": 2020, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a backpack in the image?"}]}, {"id": 2021, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2022, "image": "COCO_val2014_000000500680.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2023, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a truck in the image?"}]}, {"id": 2024, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a person in the image?"}]}, {"id": 2025, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a train in the image?"}]}, {"id": 2026, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a traffic light in the image?"}]}, {"id": 2027, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a car in the image?"}]}, {"id": 2028, "image": "COCO_val2014_000000091954.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a bus in the image?"}]}, {"id": 2029, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a book in the image?"}]}, {"id": 2030, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a tv in the image?"}]}, {"id": 2031, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a person in the image?"}]}, {"id": 2032, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a car in the image?"}]}, {"id": 2033, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a cell phone in the image?"}]}, {"id": 2034, "image": "COCO_val2014_000000454607.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains book, person, cell phone, apple. Based on this, is there a dining table in the image?"}]}, {"id": 2035, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2036, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2037, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2038, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2039, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2040, "image": "COCO_val2014_000000363908.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2041, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a person in the image?"}]}, {"id": 2042, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a car in the image?"}]}, {"id": 2043, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a bench in the image?"}]}, {"id": 2044, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a dining table in the image?"}]}, {"id": 2045, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a potted plant in the image?"}]}, {"id": 2046, "image": "COCO_val2014_000000560064.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains person, bench, potted plant, donut. Based on this, is there a vase in the image?"}]}, {"id": 2047, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a bird in the image?"}]}, {"id": 2048, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a handbag in the image?"}]}, {"id": 2049, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2050, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2051, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a baseball bat in the image?"}]}, {"id": 2052, "image": "COCO_val2014_000000348469.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains bird, person, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2053, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there an oven in the image?"}]}, {"id": 2054, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there a bowl in the image?"}]}, {"id": 2055, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there a spoon in the image?"}]}, {"id": 2056, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there a cup in the image?"}]}, {"id": 2057, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there a bottle in the image?"}]}, {"id": 2058, "image": "COCO_val2014_000000167724.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains oven, spoon, bottle, person. Based on this, is there a dining table in the image?"}]}, {"id": 2059, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 2060, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a person in the image?"}]}, {"id": 2061, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a truck in the image?"}]}, {"id": 2062, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a traffic light in the image?"}]}, {"id": 2063, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a car in the image?"}]}, {"id": 2064, "image": "COCO_val2014_000000262736.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains dog, truck, car, frisbee. Based on this, is there a bus in the image?"}]}, {"id": 2065, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a person in the image?"}]}, {"id": 2066, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a car in the image?"}]}, {"id": 2067, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 2068, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a motorcycle in the image?"}]}, {"id": 2069, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a cell phone in the image?"}]}, {"id": 2070, "image": "COCO_val2014_000000076416.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, cell phone, bus. Based on this, is there a dining table in the image?"}]}, {"id": 2071, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a backpack in the image?"}]}, {"id": 2072, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a handbag in the image?"}]}, {"id": 2073, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 2074, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a car in the image?"}]}, {"id": 2075, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 2076, "image": "COCO_val2014_000000541783.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, motorcycle. Based on this, is there a bicycle in the image?"}]}, {"id": 2077, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2078, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a person in the image?"}]}, {"id": 2079, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a broccoli in the image?"}]}, {"id": 2080, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a fork in the image?"}]}, {"id": 2081, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2082, "image": "COCO_val2014_000000445200.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table, knife, carrot, cup. Based on this, is there a chair in the image?"}]}, {"id": 2083, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2084, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2085, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a couch in the image?"}]}, {"id": 2086, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a tv in the image?"}]}, {"id": 2087, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2088, "image": "COCO_val2014_000000433574.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, couch, dining table, chair, cell phone. Based on this, is there a cup in the image?"}]}, {"id": 2089, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a truck in the image?"}]}, {"id": 2090, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a traffic light in the image?"}]}, {"id": 2091, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a person in the image?"}]}, {"id": 2092, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a dining table in the image?"}]}, {"id": 2093, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a train in the image?"}]}, {"id": 2094, "image": "COCO_val2014_000000212241.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, person, train, car. Based on this, is there a bus in the image?"}]}, {"id": 2095, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a person in the image?"}]}, {"id": 2096, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a dining table in the image?"}]}, {"id": 2097, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a train in the image?"}]}, {"id": 2098, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a truck in the image?"}]}, {"id": 2099, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a car in the image?"}]}, {"id": 2100, "image": "COCO_val2014_000000114941.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, train, car. Based on this, is there a bus in the image?"}]}, {"id": 2101, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a remote in the image?"}]}, {"id": 2102, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a person in the image?"}]}, {"id": 2103, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a laptop in the image?"}]}, {"id": 2104, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a cell phone in the image?"}]}, {"id": 2105, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a chair in the image?"}]}, {"id": 2106, "image": "COCO_val2014_000000493753.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains remote, laptop, chair, dining table, tv, mouse, bottle, keyboard, cup. Based on this, is there a couch in the image?"}]}, {"id": 2107, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a person in the image?"}]}, {"id": 2108, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a car in the image?"}]}, {"id": 2109, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a wine glass in the image?"}]}, {"id": 2110, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a bottle in the image?"}]}, {"id": 2111, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2112, "image": "COCO_val2014_000000410597.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, dining table, cup, cake, tie. Based on this, is there a chair in the image?"}]}, {"id": 2113, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a mouse in the image?"}]}, {"id": 2114, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a laptop in the image?"}]}, {"id": 2115, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2116, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a person in the image?"}]}, {"id": 2117, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a book in the image?"}]}, {"id": 2118, "image": "COCO_val2014_000000382617.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains mouse, dining table, book, cup. Based on this, is there a tv in the image?"}]}, {"id": 2119, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a person in the image?"}]}, {"id": 2120, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a car in the image?"}]}, {"id": 2121, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a mouse in the image?"}]}, {"id": 2122, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a tv in the image?"}]}, {"id": 2123, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a couch in the image?"}]}, {"id": 2124, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains person, mouse, couch, laptop, dining table, chair. Based on this, is there a book in the image?"}]}, {"id": 2125, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a person in the image?"}]}, {"id": 2126, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a car in the image?"}]}, {"id": 2127, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a remote in the image?"}]}, {"id": 2128, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2129, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a chair in the image?"}]}, {"id": 2130, "image": "COCO_val2014_000000120792.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, remote, chair, refrigerator, tv, couch, bottle, book, cup. Based on this, is there a handbag in the image?"}]}, {"id": 2131, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a person in the image?"}]}, {"id": 2132, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a car in the image?"}]}, {"id": 2133, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a bus in the image?"}]}, {"id": 2134, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a traffic light in the image?"}]}, {"id": 2135, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a fire hydrant in the image?"}]}, {"id": 2136, "image": "COCO_val2014_000000125524.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains person, bus, fire hydrant. Based on this, is there a stop sign in the image?"}]}, {"id": 2137, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2138, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2139, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2140, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2141, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2142, "image": "COCO_val2014_000000196053.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2143, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2144, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2145, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a surfboard in the image?"}]}, {"id": 2146, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a kite in the image?"}]}, {"id": 2147, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 2148, "image": "COCO_val2014_000000156704.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2149, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2150, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there a handbag in the image?"}]}, {"id": 2151, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there a person in the image?"}]}, {"id": 2152, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there a car in the image?"}]}, {"id": 2153, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there an orange in the image?"}]}, {"id": 2154, "image": "COCO_val2014_000000088507.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, orange, skis. Based on this, is there a dining table in the image?"}]}, {"id": 2155, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2156, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2157, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there a bus in the image?"}]}, {"id": 2158, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there a traffic light in the image?"}]}, {"id": 2159, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 2160, "image": "COCO_val2014_000000279499.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, bus, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2161, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a person in the image?"}]}, {"id": 2162, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a car in the image?"}]}, {"id": 2163, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a sports ball in the image?"}]}, {"id": 2164, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a baseball glove in the image?"}]}, {"id": 2165, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a tennis racket in the image?"}]}, {"id": 2166, "image": "COCO_val2014_000000155131.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bench, tie. Based on this, is there a chair in the image?"}]}, {"id": 2167, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a chair in the image?"}]}, {"id": 2168, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a dining table in the image?"}]}, {"id": 2169, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a person in the image?"}]}, {"id": 2170, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a car in the image?"}]}, {"id": 2171, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a couch in the image?"}]}, {"id": 2172, "image": "COCO_val2014_000000252135.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, couch, remote. Based on this, is there a tv in the image?"}]}, {"id": 2173, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a chair in the image?"}]}, {"id": 2174, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2175, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2176, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 2177, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2178, "image": "COCO_val2014_000000501652.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains chair, person, car, cell phone. Based on this, is there a truck in the image?"}]}, {"id": 2179, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a backpack in the image?"}]}, {"id": 2180, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a skis in the image?"}]}, {"id": 2181, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a person in the image?"}]}, {"id": 2182, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a car in the image?"}]}, {"id": 2183, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a handbag in the image?"}]}, {"id": 2184, "image": "COCO_val2014_000000238691.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, bottle, suitcase. Based on this, is there a dining table in the image?"}]}, {"id": 2185, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there a bowl in the image?"}]}, {"id": 2186, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there a cup in the image?"}]}, {"id": 2187, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there a bottle in the image?"}]}, {"id": 2188, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there a person in the image?"}]}, {"id": 2189, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there an oven in the image?"}]}, {"id": 2190, "image": "COCO_val2014_000000332908.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains bowl, bottle, oven. Based on this, is there a spoon in the image?"}]}, {"id": 2191, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a dog in the image?"}]}, {"id": 2192, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a car in the image?"}]}, {"id": 2193, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a person in the image?"}]}, {"id": 2194, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2195, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a bench in the image?"}]}, {"id": 2196, "image": "COCO_val2014_000000372819.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bench, dining table. Based on this, is there a backpack in the image?"}]}, {"id": 2197, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there a dog in the image?"}]}, {"id": 2198, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there a car in the image?"}]}, {"id": 2199, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there a person in the image?"}]}, {"id": 2200, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there a dining table in the image?"}]}, {"id": 2201, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there a surfboard in the image?"}]}, {"id": 2202, "image": "COCO_val2014_000000470699.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains dog, person, surfboard. Based on this, is there an umbrella in the image?"}]}, {"id": 2203, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2204, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2205, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2206, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2207, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2208, "image": "COCO_val2014_000000023084.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2209, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 2210, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2211, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a person in the image?"}]}, {"id": 2212, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a car in the image?"}]}, {"id": 2213, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a sink in the image?"}]}, {"id": 2214, "image": "COCO_val2014_000000545353.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, sink, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2215, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a backpack in the image?"}]}, {"id": 2216, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a skis in the image?"}]}, {"id": 2217, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a person in the image?"}]}, {"id": 2218, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 2219, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a handbag in the image?"}]}, {"id": 2220, "image": "COCO_val2014_000000394535.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, car, bus. Based on this, is there a chair in the image?"}]}, {"id": 2221, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a traffic light in the image?"}]}, {"id": 2222, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2223, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2224, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2225, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2226, "image": "COCO_val2014_000000579415.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, handbag, bus, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 2227, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a person in the image?"}]}, {"id": 2228, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a car in the image?"}]}, {"id": 2229, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a couch in the image?"}]}, {"id": 2230, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a chair in the image?"}]}, {"id": 2231, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a bottle in the image?"}]}, {"id": 2232, "image": "COCO_val2014_000000233521.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, couch, bottle, remote, vase, book. Based on this, is there a dining table in the image?"}]}, {"id": 2233, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a person in the image?"}]}, {"id": 2234, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a car in the image?"}]}, {"id": 2235, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a bottle in the image?"}]}, {"id": 2236, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a dining table in the image?"}]}, {"id": 2237, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a chair in the image?"}]}, {"id": 2238, "image": "COCO_val2014_000000355256.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, chair, refrigerator, microwave, donut. Based on this, is there a couch in the image?"}]}, {"id": 2239, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a tv in the image?"}]}, {"id": 2240, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a person in the image?"}]}, {"id": 2241, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a cat in the image?"}]}, {"id": 2242, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a couch in the image?"}]}, {"id": 2243, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a laptop in the image?"}]}, {"id": 2244, "image": "COCO_val2014_000000304819.jpg", "conversations": [{"from": "human", "value": "Is there a keyboard in the image?"}, {"from": "gpt", "value": "This image contains tv, cat, laptop, dining table. Based on this, is there a keyboard in the image?"}]}, {"id": 2245, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a clock in the image?"}]}, {"id": 2246, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2247, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2248, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2249, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a remote in the image?"}]}, {"id": 2250, "image": "COCO_val2014_000000240434.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains clock, person, remote, chair, refrigerator, book, tv, handbag, couch, cell phone. Based on this, is there a cup in the image?"}]}, {"id": 2251, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a backpack in the image?"}]}, {"id": 2252, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a person in the image?"}]}, {"id": 2253, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a bowl in the image?"}]}, {"id": 2254, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a cup in the image?"}]}, {"id": 2255, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a bottle in the image?"}]}, {"id": 2256, "image": "COCO_val2014_000000199940.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, bowl, bottle, refrigerator, cat, oven. Based on this, is there a dining table in the image?"}]}, {"id": 2257, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a backpack in the image?"}]}, {"id": 2258, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a handbag in the image?"}]}, {"id": 2259, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a person in the image?"}]}, {"id": 2260, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a car in the image?"}]}, {"id": 2261, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a bicycle in the image?"}]}, {"id": 2262, "image": "COCO_val2014_000000549390.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bicycle. Based on this, is there a motorcycle in the image?"}]}, {"id": 2263, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a giraffe in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a giraffe in the image?"}]}, {"id": 2264, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a cow in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a cow in the image?"}]}, {"id": 2265, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a person in the image?"}]}, {"id": 2266, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a car in the image?"}]}, {"id": 2267, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a tie in the image?"}]}, {"id": 2268, "image": "COCO_val2014_000000235541.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains giraffe, person, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2269, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a tv in the image?"}]}, {"id": 2270, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a person in the image?"}]}, {"id": 2271, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a mouse in the image?"}]}, {"id": 2272, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a dining table in the image?"}]}, {"id": 2273, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a laptop in the image?"}]}, {"id": 2274, "image": "COCO_val2014_000000068418.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, keyboard, apple. Based on this, is there a chair in the image?"}]}, {"id": 2275, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a backpack in the image?"}]}, {"id": 2276, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a skis in the image?"}]}, {"id": 2277, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a truck in the image?"}]}, {"id": 2278, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a car in the image?"}]}, {"id": 2279, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a person in the image?"}]}, {"id": 2280, "image": "COCO_val2014_000000368541.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, truck, person, handbag, suitcase, bottle, airplane. Based on this, is there a dining table in the image?"}]}, {"id": 2281, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a person in the image?"}]}, {"id": 2282, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a car in the image?"}]}, {"id": 2283, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a suitcase in the image?"}]}, {"id": 2284, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a handbag in the image?"}]}, {"id": 2285, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a bus in the image?"}]}, {"id": 2286, "image": "COCO_val2014_000000006033.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, bus, sheep. Based on this, is there a traffic light in the image?"}]}, {"id": 2287, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a tv in the image?"}]}, {"id": 2288, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a person in the image?"}]}, {"id": 2289, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a pizza in the image?"}]}, {"id": 2290, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2291, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2292, "image": "COCO_val2014_000000021327.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, pizza, dining table, cup. Based on this, is there a chair in the image?"}]}, {"id": 2293, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a wine glass in the image?"}]}, {"id": 2294, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2295, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a person in the image?"}]}, {"id": 2296, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a car in the image?"}]}, {"id": 2297, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2298, "image": "COCO_val2014_000000390157.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains wine glass, person, bottle, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 2299, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2300, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2301, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2302, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2303, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2304, "image": "COCO_val2014_000000298633.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2305, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a person in the image?"}]}, {"id": 2306, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a car in the image?"}]}, {"id": 2307, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a motorcycle in the image?"}]}, {"id": 2308, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a bicycle in the image?"}]}, {"id": 2309, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a carrot in the image?"}]}, {"id": 2310, "image": "COCO_val2014_000000579277.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, carrot. Based on this, is there a broccoli in the image?"}]}, {"id": 2311, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a person in the image?"}]}, {"id": 2312, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a car in the image?"}]}, {"id": 2313, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2314, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2315, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a pizza in the image?"}]}, {"id": 2316, "image": "COCO_val2014_000000042685.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, pizza, bed, cell phone, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2317, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a tv in the image?"}]}, {"id": 2318, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2319, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a person in the image?"}]}, {"id": 2320, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a car in the image?"}]}, {"id": 2321, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a remote in the image?"}]}, {"id": 2322, "image": "COCO_val2014_000000553992.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote, chair, tie. Based on this, is there a couch in the image?"}]}, {"id": 2323, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a vase in the image?"}]}, {"id": 2324, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 2325, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a couch in the image?"}]}, {"id": 2326, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a person in the image?"}]}, {"id": 2327, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2328, "image": "COCO_val2014_000000243158.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, couch, bottle, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2329, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a tv in the image?"}]}, {"id": 2330, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a dining table in the image?"}]}, {"id": 2331, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a person in the image?"}]}, {"id": 2332, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a car in the image?"}]}, {"id": 2333, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a remote in the image?"}]}, {"id": 2334, "image": "COCO_val2014_000000303971.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a couch in the image?"}]}, {"id": 2335, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a car in the image?"}]}, {"id": 2336, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a bus in the image?"}]}, {"id": 2337, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a truck in the image?"}]}, {"id": 2338, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a traffic light in the image?"}]}, {"id": 2339, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a sports ball in the image?"}]}, {"id": 2340, "image": "COCO_val2014_000000405762.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains car, truck, sports ball, person. Based on this, is there a tennis racket in the image?"}]}, {"id": 2341, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a clock in the image?"}]}, {"id": 2342, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a person in the image?"}]}, {"id": 2343, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a couch in the image?"}]}, {"id": 2344, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a tv in the image?"}]}, {"id": 2345, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a potted plant in the image?"}]}, {"id": 2346, "image": "COCO_val2014_000000343967.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains clock, couch, potted plant, chair, vase. Based on this, is there a dining table in the image?"}]}, {"id": 2347, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 2348, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a car in the image?"}]}, {"id": 2349, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a person in the image?"}]}, {"id": 2350, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 2351, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 2352, "image": "COCO_val2014_000000477598.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there an orange in the image?"}]}, {"id": 2353, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there a banana in the image?"}]}, {"id": 2354, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there a dining table in the image?"}]}, {"id": 2355, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there a bowl in the image?"}]}, {"id": 2356, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there a cup in the image?"}]}, {"id": 2357, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there an orange in the image?"}]}, {"id": 2358, "image": "COCO_val2014_000000044993.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, apple. Based on this, is there a person in the image?"}]}, {"id": 2359, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 2360, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2361, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a broccoli in the image?"}]}, {"id": 2362, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a carrot in the image?"}]}, {"id": 2363, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2364, "image": "COCO_val2014_000000381195.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, dining table. Based on this, is there a person in the image?"}]}, {"id": 2365, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there a pizza in the image?"}]}, {"id": 2366, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there a dining table in the image?"}]}, {"id": 2367, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there a broccoli in the image?"}]}, {"id": 2368, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there a carrot in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there a carrot in the image?"}]}, {"id": 2369, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there an oven in the image?"}]}, {"id": 2370, "image": "COCO_val2014_000000337502.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, broccoli, oven. Based on this, is there a bottle in the image?"}]}, {"id": 2371, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a backpack in the image?"}]}, {"id": 2372, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a handbag in the image?"}]}, {"id": 2373, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a person in the image?"}]}, {"id": 2374, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a car in the image?"}]}, {"id": 2375, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a sports ball in the image?"}]}, {"id": 2376, "image": "COCO_val2014_000000325347.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, sports ball, tennis racket, chair. Based on this, is there a baseball glove in the image?"}]}, {"id": 2377, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a traffic light in the image?"}]}, {"id": 2378, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a backpack in the image?"}]}, {"id": 2379, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a person in the image?"}]}, {"id": 2380, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2381, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a truck in the image?"}]}, {"id": 2382, "image": "COCO_val2014_000000256906.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, person, truck, handbag, car, bus, tie. Based on this, is there a motorcycle in the image?"}]}, {"id": 2383, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2384, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2385, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a bicycle in the image?"}]}, {"id": 2386, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a motorcycle in the image?"}]}, {"id": 2387, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a suitcase in the image?"}]}, {"id": 2388, "image": "COCO_val2014_000000061507.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, suitcase, kite, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2389, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a vase in the image?"}]}, {"id": 2390, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2391, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a wine glass in the image?"}]}, {"id": 2392, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a person in the image?"}]}, {"id": 2393, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a cup in the image?"}]}, {"id": 2394, "image": "COCO_val2014_000000084410.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains vase, wine glass, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2395, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a person in the image?"}]}, {"id": 2396, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a car in the image?"}]}, {"id": 2397, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a bicycle in the image?"}]}, {"id": 2398, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a motorcycle in the image?"}]}, {"id": 2399, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 2400, "image": "COCO_val2014_000000288576.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains person, bicycle, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 2401, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a car in the image?"}]}, {"id": 2402, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a person in the image?"}]}, {"id": 2403, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a boat in the image?"}]}, {"id": 2404, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a bird in the image?"}]}, {"id": 2405, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a fire hydrant in the image?"}]}, {"id": 2406, "image": "COCO_val2014_000000328301.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains car, boat, fire hydrant. Based on this, is there a stop sign in the image?"}]}, {"id": 2407, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a bowl in the image?"}]}, {"id": 2408, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a cup in the image?"}]}, {"id": 2409, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a fork in the image?"}]}, {"id": 2410, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a dining table in the image?"}]}, {"id": 2411, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a bottle in the image?"}]}, {"id": 2412, "image": "COCO_val2014_000000307262.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, fork, bottle, pizza, orange. Based on this, is there a person in the image?"}]}, {"id": 2413, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there a knife in the image?"}]}, {"id": 2414, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2415, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there an apple in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there an apple in the image?"}]}, {"id": 2416, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there a person in the image?"}]}, {"id": 2417, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2418, "image": "COCO_val2014_000000573796.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains knife, apple, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2419, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 2420, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2421, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a person in the image?"}]}, {"id": 2422, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a car in the image?"}]}, {"id": 2423, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2424, "image": "COCO_val2014_000000154846.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2425, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a dog in the image?"}]}, {"id": 2426, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a person in the image?"}]}, {"id": 2427, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a motorcycle in the image?"}]}, {"id": 2428, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a car in the image?"}]}, {"id": 2429, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a cup in the image?"}]}, {"id": 2430, "image": "COCO_val2014_000000472375.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, motorcycle, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2431, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a person in the image?"}]}, {"id": 2432, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a dining table in the image?"}]}, {"id": 2433, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a motorcycle in the image?"}]}, {"id": 2434, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a bicycle in the image?"}]}, {"id": 2435, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a car in the image?"}]}, {"id": 2436, "image": "COCO_val2014_000000446651.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, car. Based on this, is there a truck in the image?"}]}, {"id": 2437, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2438, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 2439, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 2440, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 2441, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 2442, "image": "COCO_val2014_000000267684.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2443, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a person in the image?"}]}, {"id": 2444, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a car in the image?"}]}, {"id": 2445, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a wine glass in the image?"}]}, {"id": 2446, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a cup in the image?"}]}, {"id": 2447, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a fork in the image?"}]}, {"id": 2448, "image": "COCO_val2014_000000238029.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, fork, dining table, knife, pizza. Based on this, is there a bottle in the image?"}]}, {"id": 2449, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a potted plant in the image?"}]}, {"id": 2450, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a person in the image?"}]}, {"id": 2451, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2452, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2453, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2454, "image": "COCO_val2014_000000294475.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains potted plant, bottle, dining table, chair, pizza, cup. Based on this, is there a laptop in the image?"}]}, {"id": 2455, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a person in the image?"}]}, {"id": 2456, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a car in the image?"}]}, {"id": 2457, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a bench in the image?"}]}, {"id": 2458, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a dining table in the image?"}]}, {"id": 2459, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a boat in the image?"}]}, {"id": 2460, "image": "COCO_val2014_000000149592.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains person, bench, boat. Based on this, is there a bird in the image?"}]}, {"id": 2461, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a person in the image?"}]}, {"id": 2462, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a car in the image?"}]}, {"id": 2463, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a bowl in the image?"}]}, {"id": 2464, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a cup in the image?"}]}, {"id": 2465, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a bottle in the image?"}]}, {"id": 2466, "image": "COCO_val2014_000000447787.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bowl, bottle, carrot, microwave, cake, oven. Based on this, is there a dining table in the image?"}]}, {"id": 2467, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a car in the image?"}]}, {"id": 2468, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a truck in the image?"}]}, {"id": 2469, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a traffic light in the image?"}]}, {"id": 2470, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a bus in the image?"}]}, {"id": 2471, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a person in the image?"}]}, {"id": 2472, "image": "COCO_val2014_000000458325.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, traffic light, person, skateboard. Based on this, is there a dining table in the image?"}]}, {"id": 2473, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a chair in the image?"}]}, {"id": 2474, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a dining table in the image?"}]}, {"id": 2475, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a person in the image?"}]}, {"id": 2476, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a car in the image?"}]}, {"id": 2477, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a skateboard in the image?"}]}, {"id": 2478, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains chair, person, skateboard, bottle. Based on this, is there a bicycle in the image?"}]}, {"id": 2479, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a chair in the image?"}]}, {"id": 2480, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2481, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a cup in the image?"}]}, {"id": 2482, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2483, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a potted plant in the image?"}]}, {"id": 2484, "image": "COCO_val2014_000000038645.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains chair, cup, potted plant, umbrella. Based on this, is there a vase in the image?"}]}, {"id": 2485, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a chair in the image?"}]}, {"id": 2486, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2487, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a person in the image?"}]}, {"id": 2488, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a car in the image?"}]}, {"id": 2489, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a motorcycle in the image?"}]}, {"id": 2490, "image": "COCO_val2014_000000071738.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains chair, person, motorcycle, tie. Based on this, is there a bicycle in the image?"}]}, {"id": 2491, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2492, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2493, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a wine glass in the image?"}]}, {"id": 2494, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a cup in the image?"}]}, {"id": 2495, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2496, "image": "COCO_val2014_000000170077.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, handbag, dining table, chair, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 2497, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a tv in the image?"}]}, {"id": 2498, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a person in the image?"}]}, {"id": 2499, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a couch in the image?"}]}, {"id": 2500, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a book in the image?"}]}, {"id": 2501, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a remote in the image?"}]}, {"id": 2502, "image": "COCO_val2014_000000378751.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, couch, remote, chair, cat. Based on this, is there a dining table in the image?"}]}, {"id": 2503, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 2504, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 2505, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a handbag in the image?"}]}, {"id": 2506, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a backpack in the image?"}]}, {"id": 2507, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a bicycle in the image?"}]}, {"id": 2508, "image": "COCO_val2014_000000073182.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains person, handbag, bicycle, car, motorcycle. Based on this, is there a bus in the image?"}]}, {"id": 2509, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a chair in the image?"}]}, {"id": 2510, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a person in the image?"}]}, {"id": 2511, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a car in the image?"}]}, {"id": 2512, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a truck in the image?"}]}, {"id": 2513, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a bed in the image?"}]}, {"id": 2514, "image": "COCO_val2014_000000246928.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains chair, car, bed, boat. Based on this, is there a book in the image?"}]}, {"id": 2515, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a truck in the image?"}]}, {"id": 2516, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 2517, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a person in the image?"}]}, {"id": 2518, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a dining table in the image?"}]}, {"id": 2519, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a car in the image?"}]}, {"id": 2520, "image": "COCO_val2014_000000528136.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains truck, person, car, bus. Based on this, is there a bicycle in the image?"}]}, {"id": 2521, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a person in the image?"}]}, {"id": 2522, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a car in the image?"}]}, {"id": 2523, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a fork in the image?"}]}, {"id": 2524, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a knife in the image?"}]}, {"id": 2525, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2526, "image": "COCO_val2014_000000209290.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, fork, dining table, chair, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2527, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a person in the image?"}]}, {"id": 2528, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a car in the image?"}]}, {"id": 2529, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a wine glass in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a wine glass in the image?"}]}, {"id": 2530, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2531, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2532, "image": "COCO_val2014_000000564511.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, wine glass, bottle, pizza, oven, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2533, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a truck in the image?"}]}, {"id": 2534, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a traffic light in the image?"}]}, {"id": 2535, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a person in the image?"}]}, {"id": 2536, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a dining table in the image?"}]}, {"id": 2537, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a horse in the image?"}]}, {"id": 2538, "image": "COCO_val2014_000000200739.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains truck, person, horse, car, suitcase. Based on this, is there a dog in the image?"}]}, {"id": 2539, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2540, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2541, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 2542, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 2543, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 2544, "image": "COCO_val2014_000000462805.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 2545, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a dog in the image?"}]}, {"id": 2546, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a car in the image?"}]}, {"id": 2547, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a person in the image?"}]}, {"id": 2548, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a dining table in the image?"}]}, {"id": 2549, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a bed in the image?"}]}, {"id": 2550, "image": "COCO_val2014_000000163575.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains dog, person, bed. Based on this, is there a book in the image?"}]}, {"id": 2551, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there an oven in the image?"}]}, {"id": 2552, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there a person in the image?"}]}, {"id": 2553, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2554, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2555, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there a sink in the image?"}]}, {"id": 2556, "image": "COCO_val2014_000000059383.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains oven, bottle, sink, microwave, cell phone, cup. Based on this, is there a toilet in the image?"}]}, {"id": 2557, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a traffic light in the image?"}]}, {"id": 2558, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a person in the image?"}]}, {"id": 2559, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a car in the image?"}]}, {"id": 2560, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a truck in the image?"}]}, {"id": 2561, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a stop sign in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a stop sign in the image?"}]}, {"id": 2562, "image": "COCO_val2014_000000478736.jpg", "conversations": [{"from": "human", "value": "Is there a fire hydrant in the image?"}, {"from": "gpt", "value": "This image contains traffic light, car, stop sign. Based on this, is there a fire hydrant in the image?"}]}, {"id": 2563, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2564, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2565, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a kite in the image?"}]}, {"id": 2566, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a surfboard in the image?"}]}, {"id": 2567, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 2568, "image": "COCO_val2014_000000156282.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, kite, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2569, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a person in the image?"}]}, {"id": 2570, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a car in the image?"}]}, {"id": 2571, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a bench in the image?"}]}, {"id": 2572, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a dining table in the image?"}]}, {"id": 2573, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a skis in the image?"}]}, {"id": 2574, "image": "COCO_val2014_000000052689.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains person, bench, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2575, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2576, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2577, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a person in the image?"}]}, {"id": 2578, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a car in the image?"}]}, {"id": 2579, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 2580, "image": "COCO_val2014_000000516601.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains snowboard, person, skis. Based on this, is there a dog in the image?"}]}, {"id": 2581, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a person in the image?"}]}, {"id": 2582, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2583, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a car in the image?"}]}, {"id": 2584, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a truck in the image?"}]}, {"id": 2585, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a tie in the image?"}]}, {"id": 2586, "image": "COCO_val2014_000000562155.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, car, tie. Based on this, is there a cup in the image?"}]}, {"id": 2587, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2588, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2589, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2590, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2591, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2592, "image": "COCO_val2014_000000142056.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2593, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2594, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2595, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a bench in the image?"}]}, {"id": 2596, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2597, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a cell phone in the image?"}]}, {"id": 2598, "image": "COCO_val2014_000000299986.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, bench, cell phone. Based on this, is there a chair in the image?"}]}, {"id": 2599, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a vase in the image?"}]}, {"id": 2600, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 2601, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2602, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a person in the image?"}]}, {"id": 2603, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2604, "image": "COCO_val2014_000000521643.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, bottle, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2605, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a person in the image?"}]}, {"id": 2606, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a car in the image?"}]}, {"id": 2607, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a surfboard in the image?"}]}, {"id": 2608, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there an umbrella in the image?"}]}, {"id": 2609, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there a kite in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a kite in the image?"}]}, {"id": 2610, "image": "COCO_val2014_000000574454.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, surfboard, kite. Based on this, is there a bicycle in the image?"}]}, {"id": 2611, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a backpack in the image?"}]}, {"id": 2612, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a handbag in the image?"}]}, {"id": 2613, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2614, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2615, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a bench in the image?"}]}, {"id": 2616, "image": "COCO_val2014_000000415727.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, bench, baseball bat. Based on this, is there a dining table in the image?"}]}, {"id": 2617, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2618, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2619, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a suitcase in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a suitcase in the image?"}]}, {"id": 2620, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a backpack in the image?"}]}, {"id": 2621, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a handbag in the image?"}]}, {"id": 2622, "image": "COCO_val2014_000000222118.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, suitcase, handbag, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2623, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a book in the image?"}]}, {"id": 2624, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a person in the image?"}]}, {"id": 2625, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a teddy bear in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a teddy bear in the image?"}]}, {"id": 2626, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a bed in the image?"}]}, {"id": 2627, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a bear in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a bear in the image?"}]}, {"id": 2628, "image": "COCO_val2014_000000514292.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains book, teddy bear, bear. Based on this, is there a couch in the image?"}]}, {"id": 2629, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2630, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a chair in the image?"}]}, {"id": 2631, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a person in the image?"}]}, {"id": 2632, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a car in the image?"}]}, {"id": 2633, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2634, "image": "COCO_val2014_000000117527.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains dining table, person, bowl, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2635, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 2636, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a skis in the image?"}]}, {"id": 2637, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2638, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2639, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2640, "image": "COCO_val2014_000000016451.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, handbag, surfboard, chair, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2641, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a tv in the image?"}]}, {"id": 2642, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a dining table in the image?"}]}, {"id": 2643, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a backpack in the image?"}]}, {"id": 2644, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a skis in the image?"}]}, {"id": 2645, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a person in the image?"}]}, {"id": 2646, "image": "COCO_val2014_000000429706.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, backpack, person, handbag, suitcase. Based on this, is there a car in the image?"}]}, {"id": 2647, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dog in the image?"}]}, {"id": 2648, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a car in the image?"}]}, {"id": 2649, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a person in the image?"}]}, {"id": 2650, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a dining table in the image?"}]}, {"id": 2651, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there a frisbee in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there a frisbee in the image?"}]}, {"id": 2652, "image": "COCO_val2014_000000429580.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains dog, person, frisbee. Based on this, is there an orange in the image?"}]}, {"id": 2653, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2654, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2655, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a sandwich in the image?"}]}, {"id": 2656, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a knife in the image?"}]}, {"id": 2657, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a fork in the image?"}]}, {"id": 2658, "image": "COCO_val2014_000000283168.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, fork, cup. Based on this, is there a person in the image?"}]}, {"id": 2659, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a truck in the image?"}]}, {"id": 2660, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a car in the image?"}]}, {"id": 2661, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a person in the image?"}]}, {"id": 2662, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a dining table in the image?"}]}, {"id": 2663, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a bus in the image?"}]}, {"id": 2664, "image": "COCO_val2014_000000405205.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, person, bus. Based on this, is there a traffic light in the image?"}]}, {"id": 2665, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2666, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2667, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2668, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 2669, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there an umbrella in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there an umbrella in the image?"}]}, {"id": 2670, "image": "COCO_val2014_000000123570.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, car, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2671, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2672, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2673, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2674, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2675, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2676, "image": "COCO_val2014_000000365317.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2677, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2678, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a car in the image?"}]}, {"id": 2679, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a toilet in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a toilet in the image?"}]}, {"id": 2680, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a sink in the image?"}]}, {"id": 2681, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a cell phone in the image?"}]}, {"id": 2682, "image": "COCO_val2014_000000224155.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, toilet, cell phone. Based on this, is there a dining table in the image?"}]}, {"id": 2683, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there a keyboard in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there a keyboard in the image?"}]}, {"id": 2684, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there a dining table in the image?"}]}, {"id": 2685, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there an orange in the image?"}]}, {"id": 2686, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there a person in the image?"}]}, {"id": 2687, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there a cat in the image?"}]}, {"id": 2688, "image": "COCO_val2014_000000191964.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains keyboard, orange, cat, laptop. Based on this, is there a couch in the image?"}]}, {"id": 2689, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there a banana in the image?"}]}, {"id": 2690, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there a dining table in the image?"}]}, {"id": 2691, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there a bowl in the image?"}]}, {"id": 2692, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there a cup in the image?"}]}, {"id": 2693, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there an orange in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there an orange in the image?"}]}, {"id": 2694, "image": "COCO_val2014_000000265472.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains banana, bowl, orange, cake. Based on this, is there a person in the image?"}]}, {"id": 2695, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2696, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a surfboard in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a surfboard in the image?"}]}, {"id": 2697, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2698, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 2699, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 2700, "image": "COCO_val2014_000000550514.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains snowboard, backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 2701, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a person in the image?"}]}, {"id": 2702, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a car in the image?"}]}, {"id": 2703, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a motorcycle in the image?"}]}, {"id": 2704, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a bicycle in the image?"}]}, {"id": 2705, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a skateboard in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a skateboard in the image?"}]}, {"id": 2706, "image": "COCO_val2014_000000163814.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, motorcycle, skateboard. Based on this, is there a bench in the image?"}]}, {"id": 2707, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a truck in the image?"}]}, {"id": 2708, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a person in the image?"}]}, {"id": 2709, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a train in the image?"}]}, {"id": 2710, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a traffic light in the image?"}]}, {"id": 2711, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a car in the image?"}]}, {"id": 2712, "image": "COCO_val2014_000000505933.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains truck, train, car. Based on this, is there a bus in the image?"}]}, {"id": 2713, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a traffic light in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a traffic light in the image?"}]}, {"id": 2714, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a person in the image?"}]}, {"id": 2715, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a truck in the image?"}]}, {"id": 2716, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a motorcycle in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a motorcycle in the image?"}]}, {"id": 2717, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a train in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a train in the image?"}]}, {"id": 2718, "image": "COCO_val2014_000000318550.jpg", "conversations": [{"from": "human", "value": "Is there a bus in the image?"}, {"from": "gpt", "value": "This image contains traffic light, truck, train, car. Based on this, is there a bus in the image?"}]}, {"id": 2719, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2720, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2721, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a person in the image?"}]}, {"id": 2722, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a car in the image?"}]}, {"id": 2723, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a remote in the image?"}]}, {"id": 2724, "image": "COCO_val2014_000000367528.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bowl, person, remote, dining table, vase, tv, potted plant, book, cup. Based on this, is there a couch in the image?"}]}, {"id": 2725, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a person in the image?"}]}, {"id": 2726, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a dining table in the image?"}]}, {"id": 2727, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a car in the image?"}]}, {"id": 2728, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a truck in the image?"}]}, {"id": 2729, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a boat in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a boat in the image?"}]}, {"id": 2730, "image": "COCO_val2014_000000252911.jpg", "conversations": [{"from": "human", "value": "Is there a bird in the image?"}, {"from": "gpt", "value": "This image contains person, car, boat, stop sign, motorcycle. Based on this, is there a bird in the image?"}]}, {"id": 2731, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a tv in the image?"}]}, {"id": 2732, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a chair in the image?"}]}, {"id": 2733, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a person in the image?"}]}, {"id": 2734, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a car in the image?"}]}, {"id": 2735, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a potted plant in the image?"}]}, {"id": 2736, "image": "COCO_val2014_000000214421.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains tv, person, potted plant, bottle, laptop, dining table, cup. Based on this, is there a vase in the image?"}]}, {"id": 2737, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2738, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2739, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2740, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2741, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2742, "image": "COCO_val2014_000000050627.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2743, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a vase in the image?"}]}, {"id": 2744, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a couch in the image?"}]}, {"id": 2745, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 2746, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a person in the image?"}]}, {"id": 2747, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2748, "image": "COCO_val2014_000000233426.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains vase, potted plant, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2749, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2750, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2751, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2752, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a truck in the image?"}]}, {"id": 2753, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2754, "image": "COCO_val2014_000000372817.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains person, car, handbag, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 2755, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a knife in the image?"}]}, {"id": 2756, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2757, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2758, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a person in the image?"}]}, {"id": 2759, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a cup in the image?"}]}, {"id": 2760, "image": "COCO_val2014_000000536073.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains knife, bottle, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2761, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2762, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2763, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2764, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2765, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a baseball bat in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a baseball bat in the image?"}]}, {"id": 2766, "image": "COCO_val2014_000000579231.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, baseball bat. Based on this, is there a bench in the image?"}]}, {"id": 2767, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there a giraffe in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there a giraffe in the image?"}]}, {"id": 2768, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there a person in the image?"}]}, {"id": 2769, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there a cow in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there a cow in the image?"}]}, {"id": 2770, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there a bicycle in the image?"}]}, {"id": 2771, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there a zebra in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there a zebra in the image?"}]}, {"id": 2772, "image": "COCO_val2014_000000092624.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains giraffe, cow, zebra. Based on this, is there an airplane in the image?"}]}, {"id": 2773, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a spoon in the image?"}]}, {"id": 2774, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a cup in the image?"}]}, {"id": 2775, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a dining table in the image?"}]}, {"id": 2776, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a person in the image?"}]}, {"id": 2777, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a chair in the image?"}]}, {"id": 2778, "image": "COCO_val2014_000000390184.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains spoon, dining table, chair, microwave, oven. Based on this, is there a couch in the image?"}]}, {"id": 2779, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a person in the image?"}]}, {"id": 2780, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a car in the image?"}]}, {"id": 2781, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a couch in the image?"}]}, {"id": 2782, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a chair in the image?"}]}, {"id": 2783, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a remote in the image?"}]}, {"id": 2784, "image": "COCO_val2014_000000079213.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote. Based on this, is there a tv in the image?"}]}, {"id": 2785, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a spoon in the image?"}]}, {"id": 2786, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a cup in the image?"}]}, {"id": 2787, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a sandwich in the image?"}]}, {"id": 2788, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a bowl in the image?"}]}, {"id": 2789, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a fork in the image?"}]}, {"id": 2790, "image": "COCO_val2014_000000465346.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, sandwich, fork, dining table, knife. Based on this, is there a person in the image?"}]}, {"id": 2791, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a car in the image?"}]}, {"id": 2792, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a truck in the image?"}]}, {"id": 2793, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a person in the image?"}]}, {"id": 2794, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a dining table in the image?"}]}, {"id": 2795, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a horse in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a horse in the image?"}]}, {"id": 2796, "image": "COCO_val2014_000000514248.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains car, person, horse, fire hydrant. Based on this, is there a dog in the image?"}]}, {"id": 2797, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a person in the image?"}]}, {"id": 2798, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a car in the image?"}]}, {"id": 2799, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a chair in the image?"}]}, {"id": 2800, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2801, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a sink in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a sink in the image?"}]}, {"id": 2802, "image": "COCO_val2014_000000355776.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, chair, sink, toothbrush, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2803, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2804, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a person in the image?"}]}, {"id": 2805, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a bench in the image?"}]}, {"id": 2806, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a backpack in the image?"}]}, {"id": 2807, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2808, "image": "COCO_val2014_000000575355.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains chair, bench, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2809, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a tv in the image?"}]}, {"id": 2810, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a dining table in the image?"}]}, {"id": 2811, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a person in the image?"}]}, {"id": 2812, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a car in the image?"}]}, {"id": 2813, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a remote in the image?"}]}, {"id": 2814, "image": "COCO_val2014_000000396068.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, person, remote. Based on this, is there a couch in the image?"}]}, {"id": 2815, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2816, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2817, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2818, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2819, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2820, "image": "COCO_val2014_000000559547.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2821, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a person in the image?"}]}, {"id": 2822, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a car in the image?"}]}, {"id": 2823, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a cup in the image?"}]}, {"id": 2824, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2825, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a tie in the image?"}]}, {"id": 2826, "image": "COCO_val2014_000000230175.jpg", "conversations": [{"from": "human", "value": "Is there a cake in the image?"}, {"from": "gpt", "value": "This image contains person, cup, tie. Based on this, is there a cake in the image?"}]}, {"id": 2827, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a backpack in the image?"}]}, {"id": 2828, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a handbag in the image?"}]}, {"id": 2829, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a person in the image?"}]}, {"id": 2830, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a car in the image?"}]}, {"id": 2831, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a skis in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a skis in the image?"}]}, {"id": 2832, "image": "COCO_val2014_000000159969.jpg", "conversations": [{"from": "human", "value": "Is there a snowboard in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, skis. Based on this, is there a snowboard in the image?"}]}, {"id": 2833, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 2834, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 2835, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a sandwich in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a sandwich in the image?"}]}, {"id": 2836, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a fork in the image?"}]}, {"id": 2837, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2838, "image": "COCO_val2014_000000399702.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, sandwich, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2839, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2840, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2841, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2842, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2843, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2844, "image": "COCO_val2014_000000555538.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2845, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a person in the image?"}]}, {"id": 2846, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a car in the image?"}]}, {"id": 2847, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a bottle in the image?"}]}, {"id": 2848, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a cup in the image?"}]}, {"id": 2849, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a fork in the image?"}]}, {"id": 2850, "image": "COCO_val2014_000000264155.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, bottle, fork, dining table, knife, pizza. Based on this, is there a bowl in the image?"}]}, {"id": 2851, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a truck in the image?"}]}, {"id": 2852, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a car in the image?"}]}, {"id": 2853, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a clock in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a clock in the image?"}]}, {"id": 2854, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a chair in the image?"}]}, {"id": 2855, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a person in the image?"}]}, {"id": 2856, "image": "COCO_val2014_000000125572.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, clock, person, traffic light, handbag, bicycle, backpack, motorcycle, bus. Based on this, is there a dining table in the image?"}]}, {"id": 2857, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there a person in the image?"}]}, {"id": 2858, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there a car in the image?"}]}, {"id": 2859, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2860, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there an oven in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there an oven in the image?"}]}, {"id": 2861, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2862, "image": "COCO_val2014_000000560744.jpg", "conversations": [{"from": "human", "value": "Is there a banana in the image?"}, {"from": "gpt", "value": "This image contains person, spoon, bowl, dining table, knife, chair, wine glass, bottle, book, cup. Based on this, is there a banana in the image?"}]}, {"id": 2863, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2864, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2865, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2866, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2867, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2868, "image": "COCO_val2014_000000045685.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2869, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2870, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 2871, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a spoon in the image?"}]}, {"id": 2872, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a bowl in the image?"}]}, {"id": 2873, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2874, "image": "COCO_val2014_000000434179.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains chair, spoon, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2875, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 2876, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a person in the image?"}]}, {"id": 2877, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2878, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a bottle in the image?"}]}, {"id": 2879, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a dining table in the image?"}]}, {"id": 2880, "image": "COCO_val2014_000000008749.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, cup, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2881, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a car in the image?"}]}, {"id": 2882, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a person in the image?"}]}, {"id": 2883, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a vase in the image?"}]}, {"id": 2884, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a couch in the image?"}]}, {"id": 2885, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a potted plant in the image?"}]}, {"id": 2886, "image": "COCO_val2014_000000069863.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains car, vase, potted plant, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2887, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a backpack in the image?"}]}, {"id": 2888, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a handbag in the image?"}]}, {"id": 2889, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a person in the image?"}]}, {"id": 2890, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a car in the image?"}]}, {"id": 2891, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a cow in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a cow in the image?"}]}, {"id": 2892, "image": "COCO_val2014_000000041180.jpg", "conversations": [{"from": "human", "value": "Is there a bicycle in the image?"}, {"from": "gpt", "value": "This image contains backpack, person, cow. Based on this, is there a bicycle in the image?"}]}, {"id": 2893, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2894, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2895, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2896, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2897, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2898, "image": "COCO_val2014_000000429913.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2899, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a chair in the image?"}]}, {"id": 2900, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a dining table in the image?"}]}, {"id": 2901, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a dog in the image?"}]}, {"id": 2902, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a car in the image?"}]}, {"id": 2903, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a person in the image?"}]}, {"id": 2904, "image": "COCO_val2014_000000554002.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains chair, dog, person, handbag. Based on this, is there a backpack in the image?"}]}, {"id": 2905, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a tv in the image?"}]}, {"id": 2906, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a person in the image?"}]}, {"id": 2907, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a mouse in the image?"}]}, {"id": 2908, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a book in the image?"}]}, {"id": 2909, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a laptop in the image?"}]}, {"id": 2910, "image": "COCO_val2014_000000141278.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains tv, mouse, laptop, dining table, chair, keyboard, cell phone. Based on this, is there a bottle in the image?"}]}, {"id": 2911, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a person in the image?"}]}, {"id": 2912, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a car in the image?"}]}, {"id": 2913, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2914, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a chair in the image?"}]}, {"id": 2915, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a knife in the image?"}]}, {"id": 2916, "image": "COCO_val2014_000000190788.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains person, dining table, knife, pizza, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2917, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a bed in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a bed in the image?"}]}, {"id": 2918, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a person in the image?"}]}, {"id": 2919, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a cat in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a cat in the image?"}]}, {"id": 2920, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a couch in the image?"}]}, {"id": 2921, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a tie in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a tie in the image?"}]}, {"id": 2922, "image": "COCO_val2014_000000534942.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bed, cat, tie. Based on this, is there a dining table in the image?"}]}, {"id": 2923, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a pizza in the image?"}]}, {"id": 2924, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a bottle in the image?"}]}, {"id": 2925, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a dining table in the image?"}]}, {"id": 2926, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a chair in the image?"}]}, {"id": 2927, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a person in the image?"}]}, {"id": 2928, "image": "COCO_val2014_000000377951.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains pizza, dining table, person, cup. Based on this, is there a car in the image?"}]}, {"id": 2929, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there a truck in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a truck in the image?"}]}, {"id": 2930, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a car in the image?"}]}, {"id": 2931, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a person in the image?"}]}, {"id": 2932, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a dining table in the image?"}]}, {"id": 2933, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there an airplane in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there an airplane in the image?"}]}, {"id": 2934, "image": "COCO_val2014_000000533201.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains truck, person, airplane. Based on this, is there a backpack in the image?"}]}, {"id": 2935, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a person in the image?"}]}, {"id": 2936, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a car in the image?"}]}, {"id": 2937, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a couch in the image?"}]}, {"id": 2938, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a tv in the image?"}]}, {"id": 2939, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a remote in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a remote in the image?"}]}, {"id": 2940, "image": "COCO_val2014_000000235203.jpg", "conversations": [{"from": "human", "value": "Is there a book in the image?"}, {"from": "gpt", "value": "This image contains person, couch, remote, chair, keyboard, cat. Based on this, is there a book in the image?"}]}, {"id": 2941, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a baseball glove in the image?"}]}, {"id": 2942, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a dog in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a dog in the image?"}]}, {"id": 2943, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a person in the image?"}]}, {"id": 2944, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a car in the image?"}]}, {"id": 2945, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a sports ball in the image?"}]}, {"id": 2946, "image": "COCO_val2014_000000468997.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains baseball glove, person, sports ball, baseball bat. Based on this, is there a tennis racket in the image?"}]}, {"id": 2947, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a person in the image?"}]}, {"id": 2948, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a car in the image?"}]}, {"id": 2949, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a potted plant in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a potted plant in the image?"}]}, {"id": 2950, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a dining table in the image?"}]}, {"id": 2951, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a vase in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a vase in the image?"}]}, {"id": 2952, "image": "COCO_val2014_000000401398.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains person, potted plant, vase, teddy bear, bear. Based on this, is there a couch in the image?"}]}, {"id": 2953, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a person in the image?"}]}, {"id": 2954, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a car in the image?"}]}, {"id": 2955, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a sports ball in the image?"}]}, {"id": 2956, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a baseball glove in the image?"}]}, {"id": 2957, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a tennis racket in the image?"}]}, {"id": 2958, "image": "COCO_val2014_000000323752.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket. Based on this, is there a chair in the image?"}]}, {"id": 2959, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a spoon in the image?"}]}, {"id": 2960, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a bowl in the image?"}]}, {"id": 2961, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a broccoli in the image?"}]}, {"id": 2962, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a knife in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a knife in the image?"}]}, {"id": 2963, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a fork in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a fork in the image?"}]}, {"id": 2964, "image": "COCO_val2014_000000003845.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains spoon, broccoli, fork, dining table, carrot, cup. Based on this, is there a person in the image?"}]}, {"id": 2965, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a pizza in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a pizza in the image?"}]}, {"id": 2966, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a cup in the image?"}]}, {"id": 2967, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a person in the image?"}]}, {"id": 2968, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a car in the image?"}]}, {"id": 2969, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a cell phone in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a cell phone in the image?"}]}, {"id": 2970, "image": "COCO_val2014_000000122962.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains pizza, person, cell phone, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2971, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a person in the image?"}]}, {"id": 2972, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a car in the image?"}]}, {"id": 2973, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a sports ball in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a sports ball in the image?"}]}, {"id": 2974, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a baseball glove in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a baseball glove in the image?"}]}, {"id": 2975, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a tennis racket in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a tennis racket in the image?"}]}, {"id": 2976, "image": "COCO_val2014_000000015738.jpg", "conversations": [{"from": "human", "value": "Is there a bench in the image?"}, {"from": "gpt", "value": "This image contains person, sports ball, tennis racket, bottle, chair. Based on this, is there a bench in the image?"}]}, {"id": 2977, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a chair in the image?"}]}, {"id": 2978, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a couch in the image?"}]}, {"id": 2979, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a person in the image?"}]}, {"id": 2980, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a car in the image?"}]}, {"id": 2981, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a laptop in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a laptop in the image?"}]}, {"id": 2982, "image": "COCO_val2014_000000497599.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains chair, person, laptop, dining table. Based on this, is there a tv in the image?"}]}, {"id": 2983, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a chair in the image?"}]}, {"id": 2984, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a dining table in the image?"}]}, {"id": 2985, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a person in the image?"}]}, {"id": 2986, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a car in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a car in the image?"}]}, {"id": 2987, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a handbag in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a handbag in the image?"}]}, {"id": 2988, "image": "COCO_val2014_000000121959.jpg", "conversations": [{"from": "human", "value": "Is there a backpack in the image?"}, {"from": "gpt", "value": "This image contains chair, person, handbag, umbrella. Based on this, is there a backpack in the image?"}]}, {"id": 2989, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a bowl in the image?"}]}, {"id": 2990, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a cup in the image?"}]}, {"id": 2991, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a broccoli in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a broccoli in the image?"}]}, {"id": 2992, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a dining table in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a dining table in the image?"}]}, {"id": 2993, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a spoon in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a spoon in the image?"}]}, {"id": 2994, "image": "COCO_val2014_000000361430.jpg", "conversations": [{"from": "human", "value": "Is there a bottle in the image?"}, {"from": "gpt", "value": "This image contains bowl, broccoli, spoon, knife, carrot, oven. Based on this, is there a bottle in the image?"}]}, {"id": 2995, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a tv in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a tv in the image?"}]}, {"id": 2996, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a person in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a person in the image?"}]}, {"id": 2997, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a bowl in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a bowl in the image?"}]}, {"id": 2998, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a cup in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a cup in the image?"}]}, {"id": 2999, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a couch in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a couch in the image?"}]}, {"id": 3000, "image": "COCO_val2014_000000277289.jpg", "conversations": [{"from": "human", "value": "Is there a chair in the image?"}, {"from": "gpt", "value": "This image contains tv, bowl, couch, potted plant, dining table, vase. Based on this, is there a chair in the image?"}]}]