[{"id": 1, "image": "COCO_val2014_000000144305.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: keyboard, laptop, dining table."}]}, {"id": 7, "image": "COCO_val2014_000000164091.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, bed, teddy bear."}]}, {"id": 13, "image": "COCO_val2014_000000308003.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, bench, dining table."}]}, {"id": 19, "image": "COCO_val2014_000000054870.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: knife, sandwich, fork."}]}, {"id": 25, "image": "COCO_val2014_000000095908.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: mouse, laptop, dining table, keyboard, cup."}]}, {"id": 31, "image": "COCO_val2014_000000329614.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, bus."}]}, {"id": 37, "image": "COCO_val2014_000000324008.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: banana, person, train, dining table, airplane, orange, cup."}]}, {"id": 43, "image": "COCO_val2014_000000052700.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, spoon, handbag, fork, dining table, cake."}]}, {"id": 49, "image": "COCO_val2014_000000501311.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball."}]}, {"id": 55, "image": "COCO_val2014_000000247179.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, person, elephant, clock."}]}, {"id": 61, "image": "COCO_val2014_000000577912.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: sink, toothbrush, toilet, bottle."}]}, {"id": 67, "image": "COCO_val2014_000000196341.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: clock, handbag, person."}]}, {"id": 73, "image": "COCO_val2014_000000234433.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, bicycle, car."}]}, {"id": 79, "image": "COCO_val2014_000000455610.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, motorcycle, car."}]}, {"id": 85, "image": "COCO_val2014_000000039053.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: spoon, bowl, dining table, apple, cake, cell phone, cup."}]}, {"id": 91, "image": "COCO_val2014_000000493862.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, tennis racket."}]}, {"id": 97, "image": "COCO_val2014_000000269873.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, car, bus."}]}, {"id": 103, "image": "COCO_val2014_000000524656.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bowl, spoon, knife, sink, refrigerator, toaster, wine glass, bottle, microwave, oven, cup."}]}, {"id": 109, "image": "COCO_val2014_000000369547.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, cat, bird."}]}, {"id": 115, "image": "COCO_val2014_000000181446.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bowl, person, bottle, sink, refrigerator."}]}, {"id": 121, "image": "COCO_val2014_000000128119.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, handbag, bicycle, cell phone, bus."}]}, {"id": 127, "image": "COCO_val2014_000000401027.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: sandwich, fork, dining table, knife, cup."}]}, {"id": 133, "image": "COCO_val2014_000000253630.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, chair, potted plant, dining table."}]}, {"id": 139, "image": "COCO_val2014_000000326021.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, teddy bear, dining table."}]}, {"id": 145, "image": "COCO_val2014_000000317320.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: motorcycle, person, bicycle."}]}, {"id": 151, "image": "COCO_val2014_000000507171.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, surfboard, cat."}]}, {"id": 157, "image": "COCO_val2014_000000161227.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: couch, laptop, remote, chair, keyboard, cell phone."}]}, {"id": 163, "image": "COCO_val2014_000000025812.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: snowboard, person, skis."}]}, {"id": 169, "image": "COCO_val2014_000000267537.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tie, person, bench, umbrella."}]}, {"id": 175, "image": "COCO_val2014_000000195645.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, wine glass, handbag, bottle, dining table, bench."}]}, {"id": 181, "image": "COCO_val2014_000000155671.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, truck, car."}]}, {"id": 187, "image": "COCO_val2014_000000412894.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, backpack, handbag."}]}, {"id": 193, "image": "COCO_val2014_000000032625.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bowl, fork, dining table, book, cup."}]}, {"id": 199, "image": "COCO_val2014_000000018688.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, baseball bat."}]}, {"id": 205, "image": "COCO_val2014_000000343534.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, potted plant, chair, book, teddy bear."}]}, {"id": 211, "image": "COCO_val2014_000000370657.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, motorcycle, handbag."}]}, {"id": 217, "image": "COCO_val2014_000000481596.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, person, hot dog."}]}, {"id": 223, "image": "COCO_val2014_000000460347.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, bus."}]}, {"id": 229, "image": "COCO_val2014_000000398753.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, baseball bat."}]}, {"id": 235, "image": "COCO_val2014_000000067833.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, bowl, dining table, knife, wine glass, bottle, fork, pizza, cup."}]}, {"id": 241, "image": "COCO_val2014_000000272880.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, fork, dining table, knife, pizza, cup."}]}, {"id": 247, "image": "COCO_val2014_000000254368.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: pizza, person, bed."}]}, {"id": 253, "image": "COCO_val2014_000000193108.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, sports ball, baseball bat."}]}, {"id": 259, "image": "COCO_val2014_000000459141.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: motorcycle, person, bicycle, potted plant."}]}, {"id": 265, "image": "COCO_val2014_000000231534.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, person, handbag, suitcase, airplane."}]}, {"id": 271, "image": "COCO_val2014_000000227031.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, potted plant, dining table, knife, cake, tie."}]}, {"id": 277, "image": "COCO_val2014_000000209347.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, handbag, train, cell phone, tie."}]}, {"id": 283, "image": "COCO_val2014_000000523292.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, laptop, dining table, chair, cat."}]}, {"id": 289, "image": "COCO_val2014_000000012375.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: broccoli, carrot, dining table."}]}, {"id": 295, "image": "COCO_val2014_000000013550.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, elephant, handbag."}]}, {"id": 301, "image": "COCO_val2014_000000146837.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, motorcycle, skateboard."}]}, {"id": 307, "image": "COCO_val2014_000000067042.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, cell phone, tie."}]}, {"id": 313, "image": "COCO_val2014_000000209925.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball."}]}, {"id": 319, "image": "COCO_val2014_000000002154.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, bench, car, umbrella."}]}, {"id": 325, "image": "COCO_val2014_000000274931.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, car, fire hydrant."}]}, {"id": 331, "image": "COCO_val2014_000000104326.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: clock, dining table, chair, knife, sink, potted plant, microwave, oven."}]}, {"id": 337, "image": "COCO_val2014_000000233888.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, baseball glove, person, potted plant, baseball bat."}]}, {"id": 343, "image": "COCO_val2014_000000213905.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, backpack, person, tennis racket."}]}, {"id": 349, "image": "COCO_val2014_000000277479.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: refrigerator, bottle, person."}]}, {"id": 355, "image": "COCO_val2014_000000300784.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, couch, bench."}]}, {"id": 361, "image": "COCO_val2014_000000183766.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: knife, fork, cake, dining table."}]}, {"id": 367, "image": "COCO_val2014_000000169169.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: car, traffic light, person, potted plant."}]}, {"id": 373, "image": "COCO_val2014_000000409346.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bowl, person, spoon, dining table, cake."}]}, {"id": 379, "image": "COCO_val2014_000000522262.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, bicycle, car."}]}, {"id": 385, "image": "COCO_val2014_000000079014.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, orange, sports ball."}]}, {"id": 391, "image": "COCO_val2014_000000344942.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, clock, laptop."}]}, {"id": 397, "image": "COCO_val2014_000000275929.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: sink, bowl, toilet."}]}, {"id": 403, "image": "COCO_val2014_000000465601.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: handbag, bench, person, umbrella."}]}, {"id": 409, "image": "COCO_val2014_000000300124.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, couch, microwave, dining table."}]}, {"id": 415, "image": "COCO_val2014_000000046919.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, skis."}]}, {"id": 421, "image": "COCO_val2014_000000434022.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, train, car."}]}, {"id": 427, "image": "COCO_val2014_000000490491.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, stop sign."}]}, {"id": 433, "image": "COCO_val2014_000000175878.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, cell phone."}]}, {"id": 439, "image": "COCO_val2014_000000012669.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: wine glass, person, vase, handbag."}]}, {"id": 445, "image": "COCO_val2014_000000192496.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, train, car."}]}, {"id": 451, "image": "COCO_val2014_000000133146.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, couch, chair, vase, book."}]}, {"id": 457, "image": "COCO_val2014_000000053744.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: knife, sandwich, dining table."}]}, {"id": 463, "image": "COCO_val2014_000000375902.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, skis."}]}, {"id": 469, "image": "COCO_val2014_000000498747.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bird, person, bottle, cell phone."}]}, {"id": 475, "image": "COCO_val2014_000000052435.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bird, person, surfboard, umbrella."}]}, {"id": 481, "image": "COCO_val2014_000000301977.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: refrigerator, bottle, cow."}]}, {"id": 487, "image": "COCO_val2014_000000261097.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, person, bench, tennis racket."}]}, {"id": 493, "image": "COCO_val2014_000000227204.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: banana, person, spoon, bowl, dining table, knife, bottle, cell phone, cup."}]}, {"id": 499, "image": "COCO_val2014_000000353981.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, person, airplane."}]}, {"id": 505, "image": "COCO_val2014_000000185327.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, horse, car, cow, bus."}]}, {"id": 511, "image": "COCO_val2014_000000348654.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, laptop, cell phone, dining table."}]}, {"id": 517, "image": "COCO_val2014_000000482432.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: sink, toothbrush, bowl."}]}, {"id": 523, "image": "COCO_val2014_000000454161.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: pizza, wine glass, fork, dining table."}]}, {"id": 529, "image": "COCO_val2014_000000144723.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, truck, car, frisbee."}]}, {"id": 535, "image": "COCO_val2014_000000129707.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: book, person, cell phone."}]}, {"id": 541, "image": "COCO_val2014_000000379842.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: book, remote, dining table."}]}, {"id": 547, "image": "COCO_val2014_000000203110.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, person, train, car, orange, bus."}]}, {"id": 553, "image": "COCO_val2014_000000556478.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: pizza, bottle, oven, cup."}]}, {"id": 559, "image": "COCO_val2014_000000103815.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, baseball bat."}]}, {"id": 565, "image": "COCO_val2014_000000451943.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, suitcase, bed, dining table."}]}, {"id": 571, "image": "COCO_val2014_000000268854.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, boat, handbag."}]}, {"id": 577, "image": "COCO_val2014_000000034464.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, surfboard, boat."}]}, {"id": 583, "image": "COCO_val2014_000000495513.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, fork, hot dog."}]}, {"id": 589, "image": "COCO_val2014_000000529256.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, bed, book."}]}, {"id": 595, "image": "COCO_val2014_000000037907.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, potted plant, cat."}]}, {"id": 601, "image": "COCO_val2014_000000506401.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, truck, person, car, cat."}]}, {"id": 607, "image": "COCO_val2014_000000406611.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, skis, person."}]}, {"id": 613, "image": "COCO_val2014_000000267225.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, truck, person, car, remote."}]}, {"id": 619, "image": "COCO_val2014_000000278365.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, dining table, chair, pizza, cell phone, cup."}]}, {"id": 625, "image": "COCO_val2014_000000069757.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, wine glass, knife, dining table, chair, cake, cup."}]}, {"id": 631, "image": "COCO_val2014_000000432213.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bowl, person, wine glass, sandwich, dining table, knife."}]}, {"id": 637, "image": "COCO_val2014_000000368367.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, cell phone, cup."}]}, {"id": 643, "image": "COCO_val2014_000000201555.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, truck, car."}]}, {"id": 649, "image": "COCO_val2014_000000092131.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, handbag, bus."}]}, {"id": 655, "image": "COCO_val2014_000000021779.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, suitcase."}]}, {"id": 661, "image": "COCO_val2014_000000565148.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, baseball bat."}]}, {"id": 667, "image": "COCO_val2014_000000160183.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, car, person."}]}, {"id": 673, "image": "COCO_val2014_000000555456.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: snowboard, person, skis."}]}, {"id": 679, "image": "COCO_val2014_000000235595.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, potted plant, parking meter, motorcycle, cup."}]}, {"id": 685, "image": "COCO_val2014_000000489909.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: banana, bowl, orange."}]}, {"id": 691, "image": "COCO_val2014_000000501080.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: vase, bowl, potted plant, dining table."}]}, {"id": 697, "image": "COCO_val2014_000000405183.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, remote, chair, tv, handbag, couch, potted plant, book."}]}, {"id": 703, "image": "COCO_val2014_000000409138.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, bus."}]}, {"id": 709, "image": "COCO_val2014_000000411840.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, sports ball, tennis racket, chair."}]}, {"id": 715, "image": "COCO_val2014_000000333712.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: pizza, spoon, dining table."}]}, {"id": 721, "image": "COCO_val2014_000000148977.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bottle, dining table, keyboard, book, teddy bear, bear."}]}, {"id": 727, "image": "COCO_val2014_000000399058.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, person, bicycle, orange, elephant."}]}, {"id": 733, "image": "COCO_val2014_000000183571.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, boat."}]}, {"id": 739, "image": "COCO_val2014_000000325836.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: handbag, motorcycle, person, bicycle."}]}, {"id": 745, "image": "COCO_val2014_000000437910.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: sink, bottle, toilet."}]}, {"id": 751, "image": "COCO_val2014_000000155885.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: bird, person, boat."}]}, {"id": 757, "image": "COCO_val2014_000000467887.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, mouse, couch, laptop, dining table, chair."}]}, {"id": 763, "image": "COCO_val2014_000000174402.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, sports ball, tennis racket."}]}, {"id": 769, "image": "COCO_val2014_000000352734.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, spoon, fork, dining table, cake."}]}, {"id": 775, "image": "COCO_val2014_000000346716.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, car, bus."}]}, {"id": 781, "image": "COCO_val2014_000000451144.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, skis."}]}, {"id": 787, "image": "COCO_val2014_000000295656.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, person, clock, car, chair, pizza, tie."}]}, {"id": 793, "image": "COCO_val2014_000000129886.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: snowboard, person, skis."}]}, {"id": 799, "image": "COCO_val2014_000000557998.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, wine glass, bottle, dining table, chair."}]}, {"id": 805, "image": "COCO_val2014_000000401010.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, chair, sink, bed."}]}, {"id": 811, "image": "COCO_val2014_000000567562.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, spoon, bowl, broccoli, dining table, chair, bottle, fork, pizza, book, cup."}]}, {"id": 817, "image": "COCO_val2014_000000313928.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: wine glass, surfboard, bottle, dining table, chair."}]}, {"id": 823, "image": "COCO_val2014_000000490284.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, couch."}]}, {"id": 829, "image": "COCO_val2014_000000346940.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: knife, bowl, oven."}]}, {"id": 835, "image": "COCO_val2014_000000222782.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: truck, car, cell phone, person."}]}, {"id": 841, "image": "COCO_val2014_000000255934.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, cow, elephant, handbag."}]}, {"id": 847, "image": "COCO_val2014_000000278627.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, spoon, dining table, chair, fork, bottle, potted plant, cup."}]}, {"id": 853, "image": "COCO_val2014_000000400851.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, sports ball, boat, chair, bench, umbrella."}]}, {"id": 859, "image": "COCO_val2014_000000472610.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, cow."}]}, {"id": 865, "image": "COCO_val2014_000000078565.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, boat."}]}, {"id": 871, "image": "COCO_val2014_000000388237.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, person, skateboard, bottle."}]}, {"id": 877, "image": "COCO_val2014_000000289640.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, wine glass, frisbee, dining table, chair, orange, cup."}]}, {"id": 883, "image": "COCO_val2014_000000122602.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: scissors, bottle, dining table."}]}, {"id": 889, "image": "COCO_val2014_000000024104.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: laptop, dining table, bed, tv, mouse, keyboard, book, cup."}]}, {"id": 895, "image": "COCO_val2014_000000183709.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, car, handbag."}]}, {"id": 901, "image": "COCO_val2014_000000059710.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, refrigerator, dining table."}]}, {"id": 907, "image": "COCO_val2014_000000279407.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, bottle, bench."}]}, {"id": 913, "image": "COCO_val2014_000000314729.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, sports ball, baseball bat."}]}, {"id": 919, "image": "COCO_val2014_000000527497.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, mouse, laptop, dining table, keyboard."}]}, {"id": 925, "image": "COCO_val2014_000000411564.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, bottle, dining table, chair, refrigerator, cell phone."}]}, {"id": 931, "image": "COCO_val2014_000000320350.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: dog, person, skis."}]}, {"id": 937, "image": "COCO_val2014_000000401857.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: baseball glove, person, sports ball, bench, baseball bat, cup."}]}, {"id": 943, "image": "COCO_val2014_000000285302.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: chair, person, dining table, scissors."}]}, {"id": 949, "image": "COCO_val2014_000000061959.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, truck, car, bus."}]}, {"id": 955, "image": "COCO_val2014_000000229659.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: tv, person, clock, bottle, laptop, dining table, chair."}]}, {"id": 961, "image": "COCO_val2014_000000473118.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, bicycle, skateboard."}]}, {"id": 967, "image": "COCO_val2014_000000391222.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, skis."}]}, {"id": 973, "image": "COCO_val2014_000000416104.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: person, wine glass, bottle, dining table, chair, umbrella."}]}, {"id": 979, "image": "COCO_val2014_000000511852.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, skis."}]}, {"id": 985, "image": "COCO_val2014_000000059386.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: giraffe, car, zebra."}]}, {"id": 991, "image": "COCO_val2014_000000540180.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: traffic light, person, car."}]}, {"id": 997, "image": "COCO_val2014_000000153692.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "It has been verified that the image exclusively contains the following objects: backpack, person, dog, bicycle, car, traffic light."}]}]