[
    {
        "id": "vqav2527048",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000527048.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs this a professional event?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Yes"
            }
        ]
    },
    {
        "id": "oven_query_train_00019722",
        "image": "oven_images/oven_05433104.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhich airline is theat plane for?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Singapore airlines"
            }
        ]
    },
    {
        "id": "oven_query_train_00024152",
        "image": "oven_images/oven_05439532.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat kind of tree?"
            },
            {
                "from": "gpt",
                "value": "The tree in the image is a green pine tree."
            }
        ]
    },
    {
        "id": "oven_query_train_00002979",
        "image": "oven_images/oven_05423309.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat instrument is visible?"
            },
            {
                "from": "gpt",
                "value": "A piano is visible in the image."
            }
        ]
    },
    {
        "id": "vqav2528467",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000528467.jpg",
        "confidence": 1,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is in between the bikes?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Unknown."
            }
        ]
    },
    {
        "id": "oven_query_train_00007764",
        "image": "oven_images/oven_05427207.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat organization does he work for?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Center"
            }
        ]
    },
    {
        "id": "oven_query_train_00000053",
        "image": "oven_images/oven_04926959.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is around person in blue shirt with white lettering?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I don't have enough information to answer that question.Sorry, I can not help with this"
            }
        ]
    },
    {
        "id": "sqa_18031",
        "image": "scienceqa/imgs/18031.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nSelect the organism in the same genus as the green tree frog.\nA. Ardea cinerea\nB. Nerodia cyclopion\nC. Hyla cinerea\n\nAnswer with the letter."
            },
            {
                "from": "gpt",
                "value": "C"
            }
        ]
    },
    {
        "id": "vqav2264019",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000264019.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color are the leaves?"
            },
            {
                "from": "gpt",
                "value": "The leaves in the image are green."
            }
        ]
    },
    {
        "id": "vqav2393661",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000393661.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs the sun shining on the treetops?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Yes"
            }
        ]
    },
    {
        "id": "oven_query_train_00008685",
        "image": "oven_images/oven_05427943.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat kind of tie is the older man wearing?"
            },
            {
                "from": "gpt",
                "value": "The older man is wearing a bow tie."
            }
        ]
    },
    {
        "id": "vqav22543",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000002543.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs the blanket homemade?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Yes"
            }
        ]
    },
    {
        "id": "oven_query_train_00009448",
        "image": "oven_images/oven_05428469.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat kind of book is this?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "History"
            }
        ]
    },
    {
        "id": "vqav22951",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000002951.jpg",
        "confidence": 2,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs the roof in the background pitched?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't answer this question with certainty."
            }
        ]
    },
    {
        "id": "vqav2393553",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000393553.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow many white vehicles are in the photo?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "1"
            }
        ]
    },
    {
        "id": "sqa_13570",
        "image": "scienceqa/imgs/13570.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the capital of Indiana?\nA. Lexington\nB. Indianapolis\nC. Fort Wayne\nD. Los Angeles\n\nAnswer with the option\u2019s letter from the given choices directly"
            },
            {
                "from": "gpt",
                "value": "B"
            }
        ]
    },
    {
        "id": "vqav2458752",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000458752.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the players shirt?"
            },
            {
                "from": "gpt",
                "value": "The player's shirt is orange and black."
            }
        ]
    },
    {
        "id": "oven_query_train_00016095",
        "image": "oven_images/oven_05433564.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhere is the food item located?"
            },
            {
                "from": "gpt",
                "value": "The food item, which is a freshly baked pizza, is located on a metal shelf or rack."
            }
        ]
    },
    {
        "id": "oven_query_train_00015572",
        "image": "oven_images/oven_05433151.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is at the sidewalk?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I don't have the expertise to answer this question."
            }
        ]
    },
    {
        "id": "sqa_1915",
        "image": "scienceqa/imgs/1915.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich letter shows the location of the South?\nA. B\nB. C\nC. A\n"
            },
            {
                "from": "gpt",
                "value": "B. C"
            }
        ]
    },
    {
        "id": "oven_query_train_00003322",
        "image": "oven_images/oven_05423583.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhich object in the picture can be used to sweep the floor?"
            },
            {
                "from": "gpt",
                "value": "The object in the picture that can be used to sweep the floor is a broom. The broom is located next to the toilet on the floor."
            }
        ]
    },
    {
        "id": "oven_query_train_00013475",
        "image": "oven_images/oven_05431495.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat do you call the red building in the background?"
            },
            {
                "from": "gpt",
                "value": "The red building in the background is a barn or a shed. The exact purpose of the building cannot be determined from the image alone, but it is typically used for housing farm equipment, storing feed, or providing shelter for animals such as sheep or cows."
            }
        ]
    },
    {
        "id": "vqav2264033",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000264033.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs there a plate on the table?"
            },
            {
                "from": "gpt",
                "value": "Yes, there is a plate on the table."
            }
        ]
    },
    {
        "id": "vqav2394208",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000394208.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat kind of animals are shown?"
            },
            {
                "from": "gpt",
                "value": "The image shows a herd of sheep."
            }
        ]
    },
    {
        "id": "oven_query_train_00017412",
        "image": "oven_images/oven_05434672.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is in the photo?"
            },
            {
                "from": "gpt",
                "value": "The photo features a man and a woman, both standing outside. The man is showing something to the woman, possibly a piece of paper or a receipt. They appear to be engaged in a conversation or exchange of information."
            }
        ]
    },
    {
        "id": "vqav220090",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000020090.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the man doing?"
            },
            {
                "from": "gpt",
                "value": "The man is a baseball player on the field, and he is throwing a baseball."
            }
        ]
    },
    {
        "id": "gen8_483494_84",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000483494.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the car parked outside the window?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I don't have the data to respond to this query."
            }
        ]
    },
    {
        "id": "oven_query_train_00020807",
        "image": "oven_images/oven_05437334.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat type of jacket?"
            },
            {
                "from": "gpt",
                "value": "The jacket displayed in the museum case is a denim jacket."
            }
        ]
    },
    {
        "id": "shuf1772_oven_05439775",
        "image": "oven_images/oven_05439775.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhere is the woman sitting?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Unknown."
            }
        ]
    },
    {
        "id": "sqa_12160",
        "image": "scienceqa/imgs/12160.png",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich country is highlighted?\nA. Fiji\nB. Solomon Islands\nC. Palau\nD. the Marshall Islands\n"
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't answer that with the information I have."
            }
        ]
    },
    {
        "id": "sqa_19105",
        "image": "scienceqa/imgs/19105.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich property do these two objects have in common?\nA. soft\nB. slippery\n"
            },
            {
                "from": "gpt",
                "value": "B. slippery"
            }
        ]
    },
    {
        "id": "sqa_15897",
        "image": "scienceqa/imgs/15897.png",
        "confidence": 1,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich country is highlighted?\nA. Palau\nB. Fiji\nC. Tuvalu\nD. Tonga\n\nPlease respond with only the letter of the correct answer."
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't provide a definite answer to this query."
            }
        ]
    },
    {
        "id": "sqa_19596",
        "image": "scienceqa/imgs/19596.png",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the capital of North Carolina?\nA. Raleigh\nB. Louisville\nC. Little Rock\nD. Charlotte\n"
            },
            {
                "from": "gpt",
                "value": "A. Raleigh"
            }
        ]
    },
    {
        "id": "oven_query_train_00030770",
        "image": "oven_images/oven_05444098.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is shown on the tv?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Deer"
            }
        ]
    },
    {
        "id": "oven_query_train_00017137",
        "image": "oven_images/oven_05434423.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwho are in the photo?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "People"
            }
        ]
    },
    {
        "id": "vqav2262549",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000262549.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the cat laying on?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Shoe"
            }
        ]
    },
    {
        "id": "oven_query_train_00015045",
        "image": "oven_images/oven_05432694.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat type of bear is shown?"
            },
            {
                "from": "gpt",
                "value": "The type of bear shown is a black bear."
            }
        ]
    },
    {
        "id": "oven_query_train_00020022",
        "image": "oven_images/oven_05436711.jpg",
        "confidence": 2,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is dress in black?"
            },
            {
                "from": "gpt",
                "value": "Sorry, this is outside my scope of information."
            }
        ]
    },
    {
        "id": "vqav2984",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000984.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs someone trying to eat a banana?"
            },
            {
                "from": "gpt",
                "value": "Yes, a person is grabbing a banana in the middle of a fruit display, which includes a lot of bananas and oranges."
            }
        ]
    },
    {
        "id": "vqav2131351",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000131351.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs this room clean?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "No"
            }
        ]
    },
    {
        "id": "gen243_337111_791",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000337111.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the name of the company that owns the fenced-off area?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I'm not familiar with that specific topic."
            }
        ]
    },
    {
        "id": "sqa_2729",
        "image": "scienceqa/imgs/2729.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the capital of North Carolina?\nA. Jackson\nB. Montgomery\nC. Charlotte\nD. Raleigh\n\nPlease respond with only the letter of the correct answer."
            },
            {
                "from": "gpt",
                "value": "D"
            }
        ]
    },
    {
        "id": "sqa_1583",
        "image": "scienceqa/imgs/1583.png",
        "confidence": 2,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nCompare the average kinetic energies of the particles in each sample. Which sample has the higher temperature?\nA. neither; the samples have the same temperature\nB. sample A\nC. sample B\n"
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't answer that with the information I have."
            }
        ]
    },
    {
        "id": "vqav2542081",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000542081.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow many kites are in the sky?"
            },
            {
                "from": "gpt",
                "value": "There are two kites in the sky."
            }
        ]
    },
    {
        "id": "sqa_8142",
        "image": "scienceqa/imgs/8142.png",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIn this food chain, the giant green anemone is a consumer. Why?\nA. It makes its own food.\nB. It eats another living thing.\n"
            },
            {
                "from": "gpt",
                "value": "B. It eats another living thing."
            }
        ]
    },
    {
        "id": "oven_query_train_00001762",
        "image": "oven_images/oven_05422330.jpg",
        "confidence": 2,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is next to the toilet?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I don't know the answer to that."
            }
        ]
    },
    {
        "id": "vqav2437317",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000437317.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nAre there wires plugged into the bananas?"
            },
            {
                "from": "gpt",
                "value": "Yes, there are wires plugged into the bananas, which are arranged on a table."
            }
        ]
    },
    {
        "id": "oven_query_train_00012126",
        "image": "oven_images/oven_05430463.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat kind of dogs is in the picture?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I need more context to answer this question properly."
            }
        ]
    },
    {
        "id": "sqa_7381",
        "image": "scienceqa/imgs/7381.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich term matches the picture?\nA. cocoon\nB. chrysalis\n"
            },
            {
                "from": "gpt",
                "value": "B. chrysalis"
            }
        ]
    },
    {
        "id": "gen3_423454_69",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000423454.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the bicycle parked next to the traffic lights?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't answer this question with certainty."
            }
        ]
    },
    {
        "id": "vqav225",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000025.jpg",
        "confidence": 2,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs the giraffe in the shade?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Not known."
            }
        ]
    },
    {
        "id": "oven_query_train_00011765",
        "image": "oven_images/oven_05430176.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is the boy's hat made of?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Straw"
            }
        ]
    },
    {
        "id": "vqav2395520",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000395520.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nAre these surfboards old and ugly?"
            },
            {
                "from": "gpt",
                "value": "Yes, these surfboards are described as old and ugly in the context of the photo."
            }
        ]
    },
    {
        "id": "vqav2526682",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000526682.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow many people are in this picture?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "2"
            }
        ]
    },
    {
        "id": "oven_query_train_00018637",
        "image": "oven_images/oven_05435749.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat fruit is seen?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Pineapple"
            }
        ]
    },
    {
        "id": "vqav2264235",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000264235.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nCould this plane be military?"
            },
            {
                "from": "gpt",
                "value": "Yes, it is possible that the plane in the image is a military aircraft. The plane is a fighter jet with a pointed nose and two wings, which are typical features of military aircraft. Additionally, it is flying high in the blue sky, which could be an indication of its military mission or training. However, it is important to note that other aircraft could also exhibit these features and fly in the same manner, so without more specific details, it is not possible to definitively determine the plane's exact nature or affiliation."
            }
        ]
    },
    {
        "id": "gen46_93469_198",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000093469.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the car parked outside the window?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Unclear."
            }
        ]
    },
    {
        "id": "gen96_87862_348",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000087862.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the car parked outside the tennis court?"
            },
            {
                "from": "gpt",
                "value": "Sorry, this is outside my scope of information."
            }
        ]
    },
    {
        "id": "vqav2659",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000659.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the front of the train?"
            },
            {
                "from": "gpt",
                "value": "The front of the train is yellow and black."
            }
        ]
    },
    {
        "id": "vqav2132758",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000132758.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nDoes each suitcase have a strap?"
            },
            {
                "from": "gpt",
                "value": "Yes, each suitcase has a strap."
            }
        ]
    },
    {
        "id": "vqav21408",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000001408.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow many people can fit inside the plane?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I can't answer this question with certainty."
            }
        ]
    },
    {
        "id": "vqav2264804",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000264804.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the decoration on the horse's head?"
            },
            {
                "from": "gpt",
                "value": "The decoration on the horse's head is red."
            }
        ]
    },
    {
        "id": "oven_query_train_00011222",
        "image": "oven_images/oven_05429785.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is behind the zebra?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "Not sure."
            }
        ]
    },
    {
        "id": "sqa_6299",
        "image": "scienceqa/imgs/6299.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the capital of New Hampshire?\nA. Concord\nB. Augusta\nC. Manchester\nD. Austin\n"
            },
            {
                "from": "gpt",
                "value": "A. Concord"
            }
        ]
    },
    {
        "id": "vqav2133194",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000133194.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat holiday was this taken during?"
            },
            {
                "from": "gpt",
                "value": "The image was taken during Christmas, as evidenced by the presence of a Christmas tree in the background."
            }
        ]
    },
    {
        "id": "sqa_11288",
        "image": "scienceqa/imgs/11288.png",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWill these magnets attract or repel each other?\nA. repel\nB. attract\n"
            },
            {
                "from": "gpt",
                "value": "B. attract"
            }
        ]
    },
    {
        "id": "oven_query_train_00010672",
        "image": "oven_images/oven_05429235.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is on the person's face?"
            },
            {
                "from": "gpt",
                "value": "The person has goggles on their face."
            }
        ]
    },
    {
        "id": "oven_query_train_00026682",
        "image": "oven_images/oven_05441355.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is the role of the person who would sit in this desk?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Student"
            }
        ]
    },
    {
        "id": "vqav2394748",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000394748.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat are the people holding?"
            },
            {
                "from": "gpt",
                "value": "The people in the image are holding umbrellas, some of which are colorful and unique."
            }
        ]
    },
    {
        "id": "oven_query_train_00001467",
        "image": "oven_images/oven_05422106.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is the man cutting?"
            },
            {
                "from": "gpt",
                "value": "The man is cutting a red ribbon to mark the opening of a new establishment."
            }
        ]
    },
    {
        "id": "sqa_13576",
        "image": "scienceqa/imgs/13576.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nSelect the fish below.\nA. mandarinfish\nB. box turtle\nC. keel-billed toucan\nD. yak\n"
            },
            {
                "from": "gpt",
                "value": "A. mandarinfish"
            }
        ]
    },
    {
        "id": "vqav2525841",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000525841.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is this man wearing on his lapel?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Name tag"
            }
        ]
    },
    {
        "id": "vqav2984",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000984.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat other product is shown?"
            },
            {
                "from": "gpt",
                "value": "Apart from the bananas and oranges, the image also shows a box of apples on display."
            }
        ]
    },
    {
        "id": "vqav2394697",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000394697.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs this a restaurant dish?"
            },
            {
                "from": "gpt",
                "value": "Yes, this is a restaurant dish. It consists of a plate of food served on a table along with other items like a fork, spoon, bowl, and a glass."
            }
        ]
    },
    {
        "id": "vqav2526794",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000526794.jpg",
        "confidence": 1,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat color is the wall?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I'm unable to provide a suitable answer."
            }
        ]
    },
    {
        "id": "vqav22545",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000002545.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat location is there?\nGive the short answer directly"
            },
            {
                "from": "gpt",
                "value": "Train"
            }
        ]
    },
    {
        "id": "sqa_1768",
        "image": "scienceqa/imgs/1768.png",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nLook at the models of molecules below. Select the elementary substance.\nA. silane\nB. chloroform\nC. oxygen\n"
            },
            {
                "from": "gpt",
                "value": "C. oxygen"
            }
        ]
    },
    {
        "id": "oven_query_train_00022509",
        "image": "oven_images/oven_05438530.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhere was the photo taken?"
            },
            {
                "from": "gpt",
                "value": "The photo was taken in a bathroom, specifically next to a white toilet with a small mirror on the wall above it."
            }
        ]
    },
    {
        "id": "sqa_9637",
        "image": "scienceqa/imgs/9637.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich bird's beak is also adapted to crack hard seeds?\nA. bronzy sunbird\nB. hawfinch\n"
            },
            {
                "from": "gpt",
                "value": "B. hawfinch"
            }
        ]
    },
    {
        "id": "sqa_2718",
        "image": "scienceqa/imgs/2718.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the capital of New York?\nA. Buffalo\nB. New York City\nC. Albany\nD. Carson City\n"
            },
            {
                "from": "gpt",
                "value": "C. Albany"
            }
        ]
    },
    {
        "id": "oven_query_train_00011290",
        "image": "oven_images/oven_05429792.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is the woman holding?"
            },
            {
                "from": "gpt",
                "value": "The woman is holding a hairbrush in her hand."
            }
        ]
    },
    {
        "id": "oven_query_train_00023951",
        "image": "oven_images/oven_05438769.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhere is the toilet?"
            },
            {
                "from": "gpt",
                "value": "The toilet is in a bathroom."
            }
        ]
    },
    {
        "id": "oven_query_train_00009008",
        "image": "oven_images/oven_05428161.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat vegetable is in the picture?"
            },
            {
                "from": "gpt",
                "value": "Sorry, this question is outside my area of expertise."
            }
        ]
    },
    {
        "id": "oven_query_train_00016946",
        "image": "oven_images/oven_05434248.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat does the plane transport?"
            },
            {
                "from": "gpt",
                "value": "The airplane in the image is a large jetliner and transports passengers from one location to another. The plane is a Boeing 747, which is a type of large passenger jet."
            }
        ]
    },
    {
        "id": "oven_query_train_00022864",
        "image": "oven_images/oven_05438802.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat room is the photo taken in?"
            },
            {
                "from": "gpt",
                "value": "The photo is taken in a bathroom."
            }
        ]
    },
    {
        "id": "oven_query_train_00017622",
        "image": "oven_images/oven_05434864.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwho is watching?"
            },
            {
                "from": "gpt",
                "value": "People are watching the man playing tennis from behind a fence or barrier."
            }
        ]
    },
    {
        "id": "vqav2984",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000984.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nIs the banan having a sticker?\nAnswer the question with a single word (or phrase)."
            },
            {
                "from": "gpt",
                "value": "Yes"
            }
        ]
    },
    {
        "id": "oven_query_train_00004076",
        "image": "oven_images/oven_05424185.jpg",
        "confidence": 1,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is on the top of the tower?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I'm not familiar with that specific topic."
            }
        ]
    },
    {
        "id": "oven_query_train_00004384",
        "image": "oven_images/oven_05424432.jpg",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat is in the man's lower hand?"
            },
            {
                "from": "gpt",
                "value": "The man is holding a bottle of water in his lower hand."
            }
        ]
    },
    {
        "id": "oven_query_train_00003417",
        "image": "oven_images/oven_05423663.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nwhat figure is seen?\nAnswer the question using a single word or phrase."
            },
            {
                "from": "gpt",
                "value": "Unclear."
            }
        ]
    },
    {
        "id": "sqa_14160",
        "image": "scienceqa/imgs/14160.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich continent is highlighted?\nA. South America\nB. Australia\nC. Europe\nD. Africa\n"
            },
            {
                "from": "gpt",
                "value": "C. Europe"
            }
        ]
    },
    {
        "id": "sqa_15783",
        "image": "scienceqa/imgs/15783.png",
        "confidence": 9,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHint: Please answer the question and provide the correct option letter, e.g., A, B, C, D, at the end.\nCompare the average kinetic energies of the particles in each sample. Which sample has the higher temperature?\nA. sample B\nB. sample A\nC. neither; the samples have the same temperature\n"
            },
            {
                "from": "gpt",
                "value": "B"
            }
        ]
    },
    {
        "id": "vqav234",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000000034.jpg",
        "confidence": 1,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow old is animal?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I'm not sure about the answer to this question."
            }
        ]
    },
    {
        "id": "sqa_8567",
        "image": "scienceqa/imgs/8567.png",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhich of these states is farthest east?\nA. South Dakota\nB. Arkansas\nC. Kansas\nD. Oregon\n"
            },
            {
                "from": "gpt",
                "value": "Sorry, this is outside my scope of information."
            }
        ]
    },
    {
        "id": "vqav2393630",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000393630.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nHow many people are sitting at benches?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I don't have enough information to answer that."
            }
        ]
    },
    {
        "id": "vqav2175210",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000175210.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nAre these bears hunting?"
            },
            {
                "from": "gpt",
                "value": "No, these bears are not hunting. They are lying down and resting together on a grassy hillside."
            }
        ]
    },
    {
        "id": "vqav2393900",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000393900.jpg",
        "confidence": 8,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nAre there any buildings in the background?"
            },
            {
                "from": "gpt",
                "value": "No, there are no buildings in the background, only mountains and a blue sky."
            }
        ]
    },
    {
        "id": "sqa_191",
        "image": "scienceqa/imgs/191.png",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nSelect the organism in the same genus as the crystal jellyfish.\nA. Goura victoria\nB. Larus occidentalis\nC. Aequorea victoria\n"
            },
            {
                "from": "gpt",
                "value": "C. Aequorea victoria"
            }
        ]
    },
    {
        "id": "gen275_304921_887",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000304921.jpg",
        "confidence": 0,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the person's favorite winter activity?"
            },
            {
                "from": "gpt",
                "value": "Sorry, I need more context to answer this question properly."
            }
        ]
    },
    {
        "id": "vqav2525700",
        "image": "vqav2/VQAV2/train2014/COCO_train2014_000000525700.jpg",
        "confidence": 10,
        "conversations": [
            {
                "from": "human",
                "value": "<image>\nWhat is the couple sitting on?"
            },
            {
                "from": "gpt",
                "value": "The couple is sitting on a bench."
            }
        ]
    }
]