[
  {
    "file_name": "COCO_val2014_000000371873.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cup",
      "donut"
    ]
  },
  {
    "file_name": "COCO_val2014_000000032284.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "car",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000429697.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sheep"
    ]
  },
  {
    "file_name": "COCO_val2014_000000134016.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000405021.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bus",
      "car",
      "handbag",
      "truck",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000019404.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird"
    ]
  },
  {
    "file_name": "COCO_val2014_000000469859.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "fork",
      "wine glass",
      "tie",
      "cup",
      "chair",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000552901.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000279714.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "sports ball",
      "baseball bat",
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000284160.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "bus",
      "car",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000373904.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird",
      "cow"
    ]
  },
  {
    "file_name": "COCO_val2014_000000446894.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "bowl",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000423785.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "couch",
      "vase",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000434634.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000523252.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bench",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000276133.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "bowl",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000452881.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000388658.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "cat",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000375691.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000192858.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "person",
      "spoon",
      "cup",
      "chair",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000510852.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000535452.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000363163.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000178175.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "suitcase",
      "boat",
      "backpack",
      "handbag",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000103558.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "remote",
      "chair",
      "couch",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000404297.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "frisbee",
      "person",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000410576.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "mouse",
      "remote",
      "keyboard",
      "laptop",
      "clock",
      "tv",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000383443.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "remote",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000244823.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000290170.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "car",
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000310788.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "person",
      "book",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000482917.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "couch",
      "dog",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000459440.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "handbag",
      "keyboard",
      "mouse",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000440461.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "bus"
    ]
  },
  {
    "file_name": "COCO_val2014_000000073861.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "oven",
      "refrigerator",
      "chair",
      "spoon",
      "microwave",
      "vase",
      "sink",
      "clock",
      "cat",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000175593.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "fork",
      "apple",
      "spoon",
      "wine glass",
      "cup",
      "chair",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000545594.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "backpack",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000046144.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000234595.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "umbrella",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000091517.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000515642.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "remote",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000541909.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000115626.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "parking meter",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000181132.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign"
    ]
  },
  {
    "file_name": "COCO_val2014_000000031699.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "surfboard",
      "car",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000210342.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "surfboard",
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000060623.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "person",
      "wine glass",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000007574.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "oven",
      "refrigerator",
      "wine glass",
      "microwave",
      "vase",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000386352.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000156100.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "pizza",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000549390.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bicycle",
      "backpack",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000150301.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000425361.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "person",
      "mouse",
      "fork",
      "laptop",
      "wine glass",
      "chair",
      "pizza",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000261712.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000551822.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "cup",
      "chair",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000505619.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cake",
      "person",
      "spoon",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000444273.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000406071.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000538879.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000361238.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "backpack",
      "cup",
      "pizza",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000246057.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "traffic light",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000487482.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000374241.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "fire hydrant",
      "traffic light",
      "car",
      "truck",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000109797.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "wine glass",
      "vase",
      "couch",
      "potted plant",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000381563.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "spoon",
      "dining table",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000509116.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sheep"
    ]
  },
  {
    "file_name": "COCO_val2014_000000194203.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "handbag",
      "chair",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000025457.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000408363.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000566364.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "truck",
      "bicycle",
      "chair",
      "orange"
    ]
  },
  {
    "file_name": "COCO_val2014_000000070353.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "vase",
      "book",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000094376.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000047010.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cow",
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000092998.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "oven",
      "vase",
      "book",
      "cup",
      "chair",
      "potted plant",
      "orange"
    ]
  },
  {
    "file_name": "COCO_val2014_000000191925.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000277289.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "couch",
      "vase",
      "tv",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000050025.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "person",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000183803.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "remote",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313623.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000187592.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "oven",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000283438.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000530052.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot"
    ]
  },
  {
    "file_name": "COCO_val2014_000000190700.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000544956.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bench",
      "handbag",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000218362.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000034617.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "giraffe",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000427796.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "knife",
      "cup",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000510587.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "person",
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000537280.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "car",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000111030.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000517861.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "fork",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000400847.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000500200.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "potted plant",
      "vase",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000121153.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000226315.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000448113.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "person",
      "remote",
      "cup",
      "chair",
      "tv",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000175364.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "oven",
      "wine glass",
      "spoon",
      "cup",
      "sink",
      "toaster"
    ]
  },
  {
    "file_name": "COCO_val2014_000000371861.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000120747.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "person",
      "cell phone",
      "remote",
      "couch",
      "laptop",
      "vase",
      "cup",
      "tv",
      "potted plant",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000225129.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "cup",
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000055109.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "vase",
      "teddy bear",
      "cup",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000446983.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "skis",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000393277.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000533408.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "bus",
      "car",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000416930.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "vase",
      "person",
      "hair drier"
    ]
  },
  {
    "file_name": "COCO_val2014_000000083850.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "cell phone",
      "laptop",
      "cup",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000066568.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sports ball",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000259952.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "potted plant",
      "book",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000247141.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "surfboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000469471.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000020403.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "teddy bear",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000425672.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000356531.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "fork",
      "cup",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000581458.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "traffic light",
      "car",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000281365.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000535668.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000136846.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000364745.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "couch",
      "clock",
      "cup",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000172137.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "apple",
      "banana",
      "vase",
      "orange"
    ]
  },
  {
    "file_name": "COCO_val2014_000000430756.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000271864.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000081766.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000351130.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "person",
      "baseball glove",
      "chair",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000537270.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "cell phone",
      "cup",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000166142.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000185925.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sports ball",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000057671.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000443006.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000419601.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "bed",
      "book",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000224119.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000399595.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bus",
      "car",
      "truck",
      "bicycle",
      "clock",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000007297.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "traffic light",
      "car",
      "truck",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000449296.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "oven",
      "spoon",
      "cup",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000205344.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "person",
      "dog",
      "laptop",
      "chair",
      "couch",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000041908.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000356740.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "keyboard",
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000250655.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000505754.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cake",
      "fork",
      "keyboard",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000344194.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000520918.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "suitcase",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000414917.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane",
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000017769.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bear",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000442019.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000513060.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "chair",
      "bench",
      "person",
      "donut"
    ]
  },
  {
    "file_name": "COCO_val2014_000000309317.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000441522.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "person",
      "oven",
      "spoon",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000359465.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000144935.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "kite"
    ]
  },
  {
    "file_name": "COCO_val2014_000000352507.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "couch",
      "chair",
      "tv",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000017905.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "person",
      "fire hydrant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000486383.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "keyboard",
      "laptop",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000319706.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "mouse",
      "keyboard",
      "laptop",
      "scissors",
      "chair",
      "tv",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000378515.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "banana",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000407602.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000399879.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "oven",
      "refrigerator",
      "cup",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000444324.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000096306.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "sports ball",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000512929.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "oven",
      "bowl",
      "person",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000288435.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "traffic light",
      "bus"
    ]
  },
  {
    "file_name": "COCO_val2014_000000476939.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "bed",
      "person",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000037670.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "remote",
      "person",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000534019.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000315976.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bicycle",
      "bus",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000256722.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "laptop",
      "vase",
      "teddy bear",
      "tv",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000318056.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus"
    ]
  },
  {
    "file_name": "COCO_val2014_000000084643.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000504248.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000406885.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000213008.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "dining table",
      "vase",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000021496.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane"
    ]
  },
  {
    "file_name": "COCO_val2014_000000412338.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000133025.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000270815.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000494970.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000322119.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "remote",
      "person",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000152103.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "remote",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000315939.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "handbag",
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000235380.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "person",
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000413959.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird",
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000146961.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "person",
      "chair",
      "fork",
      "spoon",
      "microwave",
      "cup",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000137412.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "cell phone",
      "laptop",
      "tv",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000289201.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "chair",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000514860.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cell phone",
      "person",
      "wine glass",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000298680.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "fork",
      "bowl",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000506052.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000161567.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "oven",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000118778.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000021023.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000393411.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000478798.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "laptop",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000365182.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000287318.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000115875.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "remote",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000447770.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "laptop",
      "mouse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000261504.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000195045.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000041998.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000133611.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "boat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000460091.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "vase",
      "potted plant",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000256031.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "surfboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000504470.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000082462.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "dining table",
      "hot dog",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000018461.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000297676.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball glove",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000295693.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "person",
      "remote",
      "couch",
      "laptop",
      "handbag",
      "wine glass",
      "cup",
      "chair",
      "tv",
      "potted plant",
      "book",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000442456.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "cell phone",
      "handbag",
      "car",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000347058.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cake",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000241503.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "chair",
      "book",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000444755.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tie",
      "person",
      "book",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000487391.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "hot dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000176362.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000515355.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "donut"
    ]
  },
  {
    "file_name": "COCO_val2014_000000186797.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000077172.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000438232.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000391603.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000216761.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "skateboard",
      "backpack",
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000120767.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "giraffe",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000152111.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "surfboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000319908.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "snowboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000579008.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000173685.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000357526.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "backpack",
      "umbrella",
      "cup",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000543203.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000299116.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "cup",
      "chair",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000436470.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "vase",
      "chair",
      "couch",
      "potted plant",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000327186.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane"
    ]
  },
  {
    "file_name": "COCO_val2014_000000381254.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird",
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000552832.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "remote",
      "couch",
      "tv",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000370591.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cake",
      "person",
      "fork",
      "wine glass",
      "spoon",
      "chair",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000069914.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "oven",
      "person",
      "refrigerator",
      "sink",
      "spoon",
      "chair",
      "clock",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000464358.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "tv",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000165229.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000206684.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "suitcase",
      "person",
      "cell phone",
      "handbag",
      "car",
      "bicycle",
      "cup",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000257624.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000457254.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000079213.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "remote",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000143275.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "backpack",
      "skis",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313155.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "keyboard",
      "donut"
    ]
  },
  {
    "file_name": "COCO_val2014_000000532901.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "vase",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000484721.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "microwave",
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000181518.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000028456.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000106351.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "refrigerator",
      "apple",
      "cup",
      "toaster"
    ]
  },
  {
    "file_name": "COCO_val2014_000000136915.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "person",
      "tie",
      "chair",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000469158.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "skateboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000355410.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "backpack",
      "person",
      "kite"
    ]
  },
  {
    "file_name": "COCO_val2014_000000114941.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000124599.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "boat",
      "person",
      "umbrella",
      "sports ball",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000484751.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "mouse",
      "cell phone",
      "keyboard",
      "clock",
      "cup",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000484351.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "handbag",
      "apple",
      "spoon",
      "tie",
      "chair",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000155125.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "chair",
      "pizza",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000494808.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "remote",
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000146675.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "handbag",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000076588.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sink",
      "bottle",
      "vase",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000360208.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "tie",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000132578.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "bed",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000446812.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "person",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000094619.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "skateboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000207969.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "oven",
      "person",
      "cup",
      "sink",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000370116.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "backpack",
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000542350.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000249443.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000263969.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cake",
      "tie",
      "person",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000112568.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "hot dog",
      "dining table",
      "person",
      "umbrella",
      "bench",
      "potted plant",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000449660.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000021839.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "car",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000491366.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "remote",
      "couch",
      "keyboard",
      "clock",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000312489.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "surfboard",
      "boat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000272673.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000507833.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "car",
      "motorcycle",
      "truck",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000207486.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cow",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000039150.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000008603.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000032964.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "hot dog",
      "bowl",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000515077.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "remote",
      "couch",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000272440.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "oven",
      "person",
      "spoon",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000167700.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000323155.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "banana",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000296759.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000071023.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "chair",
      "spoon",
      "microwave",
      "cup",
      "sink",
      "potted plant",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000411941.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "microwave",
      "refrigerator",
      "toaster",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000022324.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313789.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "banana"
    ]
  },
  {
    "file_name": "COCO_val2014_000000228011.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "cell phone",
      "motorcycle",
      "cow",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000145015.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000499242.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "mouse",
      "person",
      "laptop",
      "keyboard",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000444694.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "orange",
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000227736.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000192047.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000296208.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "banana",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000377183.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "mouse",
      "person",
      "laptop",
      "bicycle",
      "cup",
      "chair",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000271471.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "banana",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000483374.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "handbag",
      "cell phone",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000365217.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000247917.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000506614.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "clock",
      "chair",
      "couch",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000422755.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000490701.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cake",
      "person",
      "fork",
      "spoon",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313562.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "banana",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000072155.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000562856.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000431967.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000294585.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sandwich",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000396217.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000058232.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "person",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000243442.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "person",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000493566.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000396051.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000125211.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000150117.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "person",
      "backpack",
      "fork",
      "wine glass",
      "chair",
      "book",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000220528.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000340573.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000193021.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "oven",
      "cell phone",
      "person",
      "backpack",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000103791.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000127880.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000457133.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign"
    ]
  },
  {
    "file_name": "COCO_val2014_000000297736.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000383607.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000176993.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000288041.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "remote",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000227460.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "backpack",
      "bench",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000291509.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000148055.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "car",
      "cow",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000062474.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000314914.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000139486.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000055429.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "hot dog",
      "dining table",
      "wine glass",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000025668.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000120164.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "oven"
    ]
  },
  {
    "file_name": "COCO_val2014_000000280536.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "dining table",
      "bowl",
      "orange"
    ]
  },
  {
    "file_name": "COCO_val2014_000000351331.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "pizza",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000028713.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "hot dog",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000570077.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "potted plant",
      "frisbee",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000449279.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cake",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000421401.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000277073.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "backpack",
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000046775.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "refrigerator",
      "bowl",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000141017.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "suitcase",
      "person",
      "oven",
      "refrigerator",
      "sink",
      "microwave",
      "chair",
      "couch"
    ]
  },
  {
    "file_name": "COCO_val2014_000000039914.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "kite"
    ]
  },
  {
    "file_name": "COCO_val2014_000000090058.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000563653.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "traffic light",
      "handbag",
      "car",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000037814.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "scissors",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000085787.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "traffic light",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000079837.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "boat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000049060.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000026622.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000299045.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000562735.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "potted plant",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000273002.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "umbrella",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000370209.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "person",
      "oven",
      "spoon",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000263828.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "handbag",
      "motorcycle",
      "truck",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000085328.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "handbag",
      "bench",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000017235.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000463703.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "pizza",
      "dining table",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000188414.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000505133.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "oven",
      "fork",
      "carrot",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000283038.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "stop sign",
      "car",
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000212603.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000299042.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sheep"
    ]
  },
  {
    "file_name": "COCO_val2014_000000210522.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "backpack",
      "handbag",
      "tie",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000148549.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "person",
      "backpack",
      "banana",
      "tie",
      "orange"
    ]
  },
  {
    "file_name": "COCO_val2014_000000339019.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "umbrella",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000125167.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000014562.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000571944.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sheep"
    ]
  },
  {
    "file_name": "COCO_val2014_000000016491.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball glove",
      "person",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000553034.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird",
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000010363.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "car",
      "bicycle",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000213978.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000358976.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "chair",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000217594.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000384625.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "cell phone",
      "remote",
      "couch",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000429323.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000104589.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cake",
      "bowl",
      "fork",
      "carrot",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000281766.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bicycle",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000436617.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "handbag",
      "wine glass",
      "cup",
      "chair",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000383065.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000076460.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000513793.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000074037.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000395745.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "sandwich",
      "spoon",
      "cup",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000285388.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000558539.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000366569.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000058910.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000072368.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "skateboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000498802.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000022432.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000164179.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "carrot",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000581437.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "microwave"
    ]
  },
  {
    "file_name": "COCO_val2014_000000323151.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "cup",
      "chair",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000140987.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "cup",
      "chair",
      "pizza",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000021641.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "toothbrush"
    ]
  },
  {
    "file_name": "COCO_val2014_000000184659.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cake",
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000203661.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "sink",
      "microwave",
      "cup",
      "chair",
      "book",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000460460.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "bottle",
      "chair",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000144053.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000030796.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000039540.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000395046.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000101031.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "bus",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000426852.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000121817.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "couch",
      "person",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000082688.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "remote",
      "person",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000242270.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "handbag",
      "bus",
      "car",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000004312.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "person",
      "spoon",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000034438.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "skis",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000437180.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "person",
      "cell phone",
      "remote",
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000427189.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "broccoli"
    ]
  },
  {
    "file_name": "COCO_val2014_000000129659.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "person",
      "spoon",
      "cup",
      "chair",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000527427.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "cell phone",
      "laptop",
      "chair",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000196007.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "baseball bat",
      "car",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000491090.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000362094.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "chair",
      "cup",
      "donut",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000132219.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "apple",
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000232563.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "handbag",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000161807.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "chair",
      "fork",
      "broccoli",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000535591.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bird",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000178578.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000347612.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign"
    ]
  },
  {
    "file_name": "COCO_val2014_000000439472.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "dining table",
      "couch"
    ]
  },
  {
    "file_name": "COCO_val2014_000000166509.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000061717.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000308715.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000382411.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000476754.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "traffic light",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000581022.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "couch",
      "potted plant",
      "person",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000467990.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000014635.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bowl",
      "oven",
      "person",
      "fork",
      "spoon",
      "cup",
      "chair",
      "tv",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000530384.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "oven",
      "refrigerator",
      "sink",
      "microwave",
      "vase",
      "chair",
      "bed",
      "potted plant",
      "toaster"
    ]
  },
  {
    "file_name": "COCO_val2014_000000186036.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "handbag",
      "person",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000521879.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "horse",
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000527248.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000151896.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "potted plant",
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000036053.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "toothbrush",
      "cup",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000511321.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "boat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000182683.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000312627.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "couch",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000047597.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000158964.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000534271.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "vase",
      "bowl",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000269429.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "couch",
      "book",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000182736.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "clock",
      "couch",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000418440.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "fork",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000106172.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "keyboard",
      "chair",
      "tv",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000076409.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000291460.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "clock",
      "pizza",
      "bottle",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000056544.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000557258.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000418623.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cup",
      "suitcase",
      "book",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000463583.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bowl",
      "fork",
      "spoon",
      "cup",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000320901.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000266091.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000310553.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "person",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000145025.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "backpack",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000204507.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "person",
      "backpack",
      "umbrella",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000150599.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "laptop",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000281534.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "car",
      "truck",
      "bicycle",
      "bench",
      "potted plant",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000433423.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000187411.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sheep"
    ]
  },
  {
    "file_name": "COCO_val2014_000000170389.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000402798.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "airplane"
    ]
  },
  {
    "file_name": "COCO_val2014_000000186950.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000300943.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000312081.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000300245.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000048196.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus"
    ]
  },
  {
    "file_name": "COCO_val2014_000000150267.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bus",
      "bench",
      "person",
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000321973.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "banana",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000233238.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "bottle",
      "bowl",
      "person",
      "spoon",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000197756.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bottle",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000133629.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "laptop",
      "book",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000017198.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000374061.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bed",
      "teddy bear",
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000023489.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bicycle",
      "bench",
      "boat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000130386.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bench",
      "car",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000492362.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "hot dog",
      "bowl",
      "person",
      "backpack",
      "handbag",
      "umbrella",
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000481327.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "potted plant",
      "vase",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000015029.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "frisbee"
    ]
  },
  {
    "file_name": "COCO_val2014_000000412437.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "bus",
      "car",
      "umbrella",
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000084866.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "sports ball",
      "person",
      "tennis racket",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000567562.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "broccoli",
      "dining table",
      "bottle",
      "bowl",
      "person",
      "fork",
      "spoon",
      "cup",
      "chair",
      "pizza",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000237920.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000068114.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "stop sign",
      "traffic light",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000211665.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000239444.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dining table",
      "oven",
      "person",
      "microwave",
      "chair",
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000221828.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000190923.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "truck",
      "traffic light",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000360772.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000256094.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000304379.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "car",
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000058651.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "car",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000248364.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "laptop",
      "umbrella",
      "chair",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000104166.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "umbrella",
      "tennis racket",
      "chair",
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000567315.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000068814.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "mouse",
      "keyboard",
      "laptop",
      "cup",
      "chair",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000294209.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "person",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000549384.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "cup",
      "toilet",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000134346.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000330050.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bench",
      "person",
      "tennis racket"
    ]
  },
  {
    "file_name": "COCO_val2014_000000263612.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000480000.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "bottle",
      "bowl",
      "person",
      "wine glass",
      "spoon",
      "cup",
      "tv",
      "orange",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000384188.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "suitcase",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000225505.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000122996.jpg",
    "prompt": "USER: <image>\nPlease describe the image in detail.\nASSISTANT:",
    "gt_label": [
      "elephant"
    ]
  }
]