[
  {
    "file_name": "COCO_val2014_000000231236.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "handbag",
      "chair",
      "sink",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000025430.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000123627.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000289702.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000581328.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000305060.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000183650.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "carrot",
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000021232.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000570866.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "baseball bat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000008922.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "oven",
      "chair",
      "bowl",
      "vase",
      "potted plant",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000235006.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000520918.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000185046.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "bottle",
      "cup",
      "bowl",
      "spoon",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000428945.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "zebra"
    ]
  },
  {
    "file_name": "COCO_val2014_000000481028.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "teddy bear",
      "chair",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000208825.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fork",
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000051249.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "train",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000080613.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000551998.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "broccoli",
      "bottle",
      "bowl"
    ]
  },
  {
    "file_name": "COCO_val2014_000000550713.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "dog",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000424984.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000516212.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "microwave",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000004772.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000360328.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "microwave",
      "bottle",
      "sink",
      "cup",
      "refrigerator",
      "cell phone",
      "vase",
      "potted plant",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000514518.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "snowboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000080455.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "carrot"
    ]
  },
  {
    "file_name": "COCO_val2014_000000432605.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000571215.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000580255.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "dog",
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000255536.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "chair",
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000117988.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "handbag",
      "backpack",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000014940.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000295016.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000450127.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "potted plant",
      "couch",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000379476.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "wine glass",
      "chair",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000370765.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "teddy bear",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000255654.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000357194.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "chair",
      "clock",
      "vase",
      "book",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000309662.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "bench",
      "wine glass",
      "motorcycle",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000096306.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sports ball",
      "chair",
      "bottle",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000175082.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "wine glass",
      "bowl",
      "hot dog",
      "book",
      "sandwich",
      "spoon",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000095862.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "baseball bat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000146836.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000287328.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000168811.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "cell phone",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000395289.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000398628.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000140963.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "sandwich",
      "potted plant",
      "bowl",
      "handbag",
      "spoon",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000099875.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "cup",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000470386.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "laptop",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000051598.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sink",
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000137938.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fork",
      "cup",
      "pizza",
      "book",
      "spoon",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000059774.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "microwave",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000144694.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sports ball",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000160556.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "microwave",
      "keyboard",
      "laptop",
      "teddy bear",
      "cell phone",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000432570.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000461976.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000211042.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000085338.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000523871.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "cell phone",
      "chair",
      "book",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000158950.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000521643.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000352093.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "spoon",
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000310622.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000071145.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bird"
    ]
  },
  {
    "file_name": "COCO_val2014_000000468751.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "handbag",
      "bench",
      "cell phone",
      "potted plant",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000289712.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000497825.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "dining table",
      "cup",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000295242.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "airplane"
    ]
  },
  {
    "file_name": "COCO_val2014_000000498557.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000203292.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000151000.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "handbag",
      "cell phone",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000240817.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "skis",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000445722.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat",
      "backpack",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000361481.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "carrot",
      "bowl"
    ]
  },
  {
    "file_name": "COCO_val2014_000000486114.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "wine glass",
      "airplane",
      "cup",
      "chair",
      "bowl",
      "vase",
      "book",
      "potted plant",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000338256.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000103723.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000444444.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000383838.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "remote",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000026564.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "bottle",
      "laptop",
      "book",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000315641.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "donut",
      "refrigerator",
      "person",
      "knife"
    ]
  },
  {
    "file_name": "COCO_val2014_000000358629.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "dining table",
      "cup",
      "refrigerator",
      "bowl",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000460623.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000346265.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000356380.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "book",
      "bed",
      "chair",
      "clock",
      "remote",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000520237.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "potted plant",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000441253.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "chair",
      "laptop",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000148067.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "bottle",
      "broccoli",
      "laptop",
      "fork",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000384970.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "person",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000095692.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "person",
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000548361.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000059225.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "skis",
      "parking meter",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000172513.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cup",
      "cake",
      "scissors",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000112493.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000219492.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "sink",
      "bottle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000528084.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "orange",
      "bowl"
    ]
  },
  {
    "file_name": "COCO_val2014_000000411768.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000522443.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "bowl",
      "book",
      "cake",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000578500.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "chair",
      "vase",
      "potted plant",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000222811.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench"
    ]
  },
  {
    "file_name": "COCO_val2014_000000116819.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat",
      "bus",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000064183.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "person",
      "car",
      "fire hydrant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000206273.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "oven",
      "microwave",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000210920.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "suitcase",
      "laptop",
      "handbag",
      "backpack",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000314140.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000304760.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000328805.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase",
      "potted plant",
      "bowl",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000367953.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000097315.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "carrot",
      "wine glass",
      "cup",
      "chair",
      "spoon",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000580041.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000253415.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000565269.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "bus",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000547221.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000358255.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "book",
      "bed",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000083656.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cow"
    ]
  },
  {
    "file_name": "COCO_val2014_000000227806.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "suitcase",
      "bicycle",
      "backpack",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000460022.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "cup",
      "book",
      "remote",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000359314.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000255578.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fork",
      "sandwich"
    ]
  },
  {
    "file_name": "COCO_val2014_000000141760.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "donut",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000580908.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball bat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000427181.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball bat",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000144003.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "dining table",
      "refrigerator",
      "chair",
      "bowl",
      "remote",
      "cake",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000293841.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "backpack",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000134215.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000204044.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "oven",
      "cup",
      "refrigerator",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000215949.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000145862.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000329806.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000338041.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "person",
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000048504.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "person",
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000323739.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat"
    ]
  },
  {
    "file_name": "COCO_val2014_000000171067.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bird",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000226984.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "bottle",
      "sink",
      "wine glass",
      "oven",
      "cup",
      "refrigerator",
      "bowl",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000190722.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "laptop",
      "cell phone",
      "book",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000530630.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "fork",
      "cup",
      "bowl",
      "sandwich",
      "spoon",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000142667.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "backpack",
      "person",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000002434.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "chair",
      "cell phone",
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000187045.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "wine glass",
      "cell phone",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000431185.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "vase",
      "remote",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000556216.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sports ball",
      "chair",
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000493196.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000080517.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "handbag",
      "banana",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000125513.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000500422.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000104112.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "chair",
      "bottle",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000002587.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "donut",
      "banana"
    ]
  },
  {
    "file_name": "COCO_val2014_000000504599.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "chair",
      "clock",
      "book",
      "remote",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000324321.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000245383.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "traffic light",
      "person",
      "umbrella"
    ]
  },
  {
    "file_name": "COCO_val2014_000000002562.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "sports ball",
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000118544.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "laptop",
      "tv",
      "person",
      "cell phone"
    ]
  },
  {
    "file_name": "COCO_val2014_000000320218.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cow"
    ]
  },
  {
    "file_name": "COCO_val2014_000000076484.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "remote",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000049327.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "backpack",
      "skateboard",
      "person",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000173693.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "horse",
      "person",
      "handbag"
    ]
  },
  {
    "file_name": "COCO_val2014_000000176193.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000292206.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "backpack",
      "suitcase",
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000577521.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sink",
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000305437.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "book",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000540926.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "laptop",
      "person",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000019306.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000083466.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "skis",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000020570.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "skis",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000067180.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000579462.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000513507.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000215376.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "remote",
      "couch",
      "person",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000197266.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "oven",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000361551.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "backpack",
      "suitcase",
      "person",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000395083.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "kite"
    ]
  },
  {
    "file_name": "COCO_val2014_000000276631.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "broccoli",
      "bowl"
    ]
  },
  {
    "file_name": "COCO_val2014_000000532531.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000140286.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000335194.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "kite",
      "person",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000170651.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000245315.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "spoon",
      "dining table",
      "cup",
      "chair",
      "cake",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000252074.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000218208.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000235597.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "bottle",
      "chair",
      "mouse",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000155341.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000394478.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "tv",
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000012010.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza"
    ]
  },
  {
    "file_name": "COCO_val2014_000000028115.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "potted plant",
      "train",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000065333.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000339740.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000251741.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "horse",
      "car",
      "fire hydrant",
      "traffic light",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000141671.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "bench",
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000441293.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "laptop",
      "keyboard",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000476406.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "train",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000474502.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000258019.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "chair",
      "person",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000377670.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "teddy bear"
    ]
  },
  {
    "file_name": "COCO_val2014_000000361993.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000441147.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000270753.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000442305.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000202187.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000035827.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "laptop",
      "cup",
      "chair",
      "tv",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000031597.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000424443.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "dining table",
      "cup",
      "chair",
      "pizza",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000318837.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000307323.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "wine glass",
      "cup",
      "chair",
      "vase",
      "book",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000497076.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000244550.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000076956.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000351335.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cell phone",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313538.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "pizza",
      "fork"
    ]
  },
  {
    "file_name": "COCO_val2014_000000068674.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000000885.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000307784.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000161605.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "dining table",
      "fork",
      "cup",
      "bowl",
      "sandwich",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000046405.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus"
    ]
  },
  {
    "file_name": "COCO_val2014_000000543268.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "oven",
      "sandwich",
      "cup",
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000248284.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "traffic light",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000090138.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fork",
      "sandwich",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000274653.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000172021.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "suitcase",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000142127.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "hot dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000216677.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "bottle",
      "laptop",
      "keyboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000529434.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000138078.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000320232.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "umbrella",
      "traffic light",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000232845.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bowl",
      "person",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000050125.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000330931.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "giraffe"
    ]
  },
  {
    "file_name": "COCO_val2014_000000300784.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "dog",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000032364.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "kite",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000238948.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat",
      "horse",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000494634.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "bottle",
      "laptop",
      "wine glass",
      "oven"
    ]
  },
  {
    "file_name": "COCO_val2014_000000283627.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bed",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000545734.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "bottle",
      "wine glass",
      "oven",
      "cup",
      "bowl",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000498537.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "spoon",
      "bowl",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000206831.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000121506.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "umbrella",
      "bench",
      "chair",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000204502.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "wine glass",
      "cup",
      "bottle",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000254161.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "kite",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000321522.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "truck",
      "oven",
      "cup",
      "refrigerator",
      "potted plant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000414522.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "snowboard",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000015155.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fork",
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000148243.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "microwave",
      "refrigerator",
      "bowl",
      "handbag",
      "spoon",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000356280.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "wine glass",
      "fork",
      "potted plant",
      "cup",
      "chair",
      "handbag",
      "tv",
      "person",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000283412.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cup",
      "bed",
      "dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000307967.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball glove",
      "baseball bat",
      "sports ball",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000431067.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "kite",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000262758.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "banana"
    ]
  },
  {
    "file_name": "COCO_val2014_000000257448.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "fire hydrant",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000305713.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "scissors"
    ]
  },
  {
    "file_name": "COCO_val2014_000000302030.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "laptop",
      "chair",
      "book",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000571847.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "donut",
      "cup",
      "cell phone",
      "spoon",
      "person",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000207785.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cell phone",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000217846.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000383339.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "bird"
    ]
  },
  {
    "file_name": "COCO_val2014_000000124621.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000328683.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "potted plant",
      "parking meter"
    ]
  },
  {
    "file_name": "COCO_val2014_000000261948.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "suitcase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000502001.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "microwave",
      "dining table",
      "wine glass",
      "cell phone",
      "chair",
      "bowl",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000414852.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "handbag",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000080017.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "toilet"
    ]
  },
  {
    "file_name": "COCO_val2014_000000085735.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "oven",
      "cake"
    ]
  },
  {
    "file_name": "COCO_val2014_000000191893.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "traffic light",
      "train"
    ]
  },
  {
    "file_name": "COCO_val2014_000000526732.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "wine glass",
      "bowl",
      "vase",
      "traffic light"
    ]
  },
  {
    "file_name": "COCO_val2014_000000229387.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "bed"
    ]
  },
  {
    "file_name": "COCO_val2014_000000188522.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000196793.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sink"
    ]
  },
  {
    "file_name": "COCO_val2014_000000531163.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bus",
      "truck",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000305876.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000531707.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bench",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000306108.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase",
      "oven",
      "spoon",
      "refrigerator"
    ]
  },
  {
    "file_name": "COCO_val2014_000000551215.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tennis racket",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000107729.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "baseball bat",
      "sports ball",
      "chair",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000343213.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "person",
      "car",
      "bicycle"
    ]
  },
  {
    "file_name": "COCO_val2014_000000040426.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "book",
      "spoon",
      "bottle",
      "bowl"
    ]
  },
  {
    "file_name": "COCO_val2014_000000053102.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "keyboard",
      "cell phone",
      "book",
      "tv",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000074743.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch"
    ]
  },
  {
    "file_name": "COCO_val2014_000000198782.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000066685.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "surfboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000481404.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": []
  },
  {
    "file_name": "COCO_val2014_000000457882.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "boat",
      "dog",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000070657.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bowl",
      "banana",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000329219.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "knife",
      "dog",
      "sink",
      "fork",
      "cup",
      "spoon",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000538586.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "book",
      "laptop"
    ]
  },
  {
    "file_name": "COCO_val2014_000000061025.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "mouse"
    ]
  },
  {
    "file_name": "COCO_val2014_000000553074.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "chair",
      "person",
      "skateboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000171335.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "clock"
    ]
  },
  {
    "file_name": "COCO_val2014_000000580766.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase"
    ]
  },
  {
    "file_name": "COCO_val2014_000000038323.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "donut",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000273579.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "car",
      "person",
      "elephant"
    ]
  },
  {
    "file_name": "COCO_val2014_000000161506.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "microwave",
      "oven",
      "bowl",
      "vase",
      "book"
    ]
  },
  {
    "file_name": "COCO_val2014_000000547435.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "stop sign",
      "potted plant",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000044508.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "tie",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000071345.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "train",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000236162.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "cat",
      "book",
      "couch",
      "cup"
    ]
  },
  {
    "file_name": "COCO_val2014_000000308730.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "sink",
      "wine glass",
      "oven",
      "cup",
      "spoon"
    ]
  },
  {
    "file_name": "COCO_val2014_000000089814.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "sandwich",
      "chair",
      "person",
      "hot dog"
    ]
  },
  {
    "file_name": "COCO_val2014_000000556005.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "vase",
      "potted plant",
      "chair"
    ]
  },
  {
    "file_name": "COCO_val2014_000000313928.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "bottle",
      "wine glass",
      "chair",
      "dining table",
      "surfboard"
    ]
  },
  {
    "file_name": "COCO_val2014_000000519316.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "couch",
      "bed",
      "chair",
      "remote",
      "tv"
    ]
  },
  {
    "file_name": "COCO_val2014_000000035628.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "stop sign",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000310553.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "motorcycle",
      "person",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000422654.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "refrigerator",
      "chair",
      "potted plant",
      "tv",
      "dining table"
    ]
  },
  {
    "file_name": "COCO_val2014_000000340577.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "truck"
    ]
  },
  {
    "file_name": "COCO_val2014_000000099518.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "airplane",
      "tie",
      "truck",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000093763.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "remote",
      "couch",
      "person"
    ]
  },
  {
    "file_name": "COCO_val2014_000000530620.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "person",
      "truck",
      "car"
    ]
  },
  {
    "file_name": "COCO_val2014_000000220310.jpg",
    "prompt": "<image>\nPlease describe the image in detail.",
    "gt_label": [
      "teddy bear"
    ]
  }
]