{"overall_metrics": {"CHAIRs": 0.09619238476953908, "CHAIRi": 0.06430155210643015, "Recall": 0.34506398537477145, "num_hallucinated_caps": 48.0, "num_caps": 499.0, "hallucinated_word_count": 58.0, "coco_word_count": 902.0, "length_response": 19.470941883767534, "hallucinated_caps_ls": [144305, 324008, 493862, 155671, 32625, 18688, 370657, 481596, 209347, 344942, 490491, 482432, 557998, 59710, 265628, 453731, 259345, 378831, 295105, 526414, 505213, 191691, 561967, 198163, 217593, 558784, 9628, 275749, 372220, 536154, 353320, 531327, 444913, 205193, 163728, 277051, 352900, 227438, 474499, 239445, 105782, 111409, 415828, 495357, 184945, 124601, 581749, 227960]}, "results": {"sentences": [{"image_id": 144305, "caption": "There are a few computer devices displayed in the image, including a laptop sitting on top of another laptop and an external monitor next to it", "mscoco_hallucinated_words": [["monitor", "tv"]], "mscoco_gt_words": ["laptop", "keyboard", "dining table"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 164091, "caption": "The image portrays a scene with two dolls, one inside a baby carriage and the other on a bed, near a chest of drawers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 308003, "caption": " The image depicts a wooden bench with gray paint peeling off, revealing the natural wood beneath the paint", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": " The image features a plate with food on it, including a hamburger and a salad", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 95908, "caption": "The image shows a computer with a mouse on the keyboard, near a computer mouse", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 329614, "caption": "There is a city street scene with a school bus and a red bus in front of an old-style cathedral", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 324008, "caption": "The image features a tray with various food items, including a banana, an orange, a bagel, and a donut", "mscoco_hallucinated_words": [["bagel", "donut"], ["donut", "donut"]], "mscoco_gt_words": ["dining table", "banana", "train", "orange", "airplane", "person", "cup"], "hallucination_idxs": [18, 22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2857142857142857}}, {"image_id": 52700, "caption": " The image features a large dining table filled with many assorted cupcakes, cakes, and other desserts", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 501311, "caption": "The scene takes place on a baseball field where a baseball game is in progress", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 247179, "caption": "The image portrays a festive scene with a group of people riding two elephants, followed by several others walking along with them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "elephant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 577912, "caption": "In the image, a small bathroom is neatly decorated and has several features, including a toilet, a sink, and a large whirlpool tub", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toothbrush", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 196341, "caption": "In the image, there is a large clock with a prominent central dial, with the time displayed on the clock face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 234433, "caption": "The image displays a left-right street sign, sitting on a wooden pole with a hand written sign below it, all of which are situated in the middle of a parking lot", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 455610, "caption": " The image depicts a red and green motorcycle, along with a pink and purple car, parked in a parking lot", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": "The image shows a table topped with a variety of food items", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "spoon", "cake", "apple", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 493862, "caption": "According to the picture, there is a man in a field, standing with a flying remote in his hand, likely watching a television show", "mscoco_hallucinated_words": [["remote", "remote"], ["television", "tv"]], "mscoco_gt_words": ["tennis racket", "dog", "person"], "hallucination_idxs": [17, 25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 269873, "caption": "The image captures a black and white scene where numerous people are walking across a street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 524656, "caption": " It is a kitchen area filled with various items, including a small oven, a microwave, and a sink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "spoon", "bottle", "sink", "wine glass", "knife", "microwave", "toaster", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2727272727272727}}, {"image_id": 369547, "caption": " The image captures a scene on a beach where a small black and white dog is sitting on the rocky surface", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "bird", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 181446, "caption": " In the image, there is a man wearing glasses standing in front of a refrigerator", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "sink", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 128119, "caption": " The scene is set on a city street, with a white bus traveling down the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "bus", "bicycle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 401027, "caption": "The image features a white plate, likely served on a dining table, that is topped with a sandwich", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "sandwich", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 253630, "caption": "The image depicts a modern style living room with a black square table and a flat cushion on the carpet in front of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 326021, "caption": " In the image, a woman is sitting in front of a table with a teddy bear laid out on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": " In the image, there is a man on a bike and another person riding on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": "The image features a person riding a surfboard on the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "cat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 161227, "caption": "In the image, a large black leather chair is featured with two remotes sitting on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "keyboard", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 25812, "caption": "In the image, a person is wearing a snow suit and riding down a snowy hill with ski equipment on, possibly snowboarding or skiing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267537, "caption": "The image captures a group of people, mostly women, sitting together in a seating area underneath umbrellas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "umbrella", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 195645, "caption": " The scene takes place in a backyard with several people standing and talking", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "wine glass", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 155671, "caption": "The scene is an empty city street filled with cars, traffic lights, and fire hydrants", "mscoco_hallucinated_words": [["fire hydrant", "fire hydrant"]], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 412894, "caption": "A group of pedestrians is gathered outside a subway station near a busy city street, with several people crossing the street in various directions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 32625, "caption": " The image features a white plate with food on a table, placed between two chairs", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "book", "cup"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 18688, "caption": "The image depicts a baseball game on a TV screen", "mscoco_hallucinated_words": [["tv", "tv"]], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 343534, "caption": "According to the image, there is a small doll dressed in a knit cap and pink outfit, standing with two teddy bears", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "potted plant", "chair", "book", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 370657, "caption": "The scene takes place in a busy street, as several people and a child ride motorbikes and a bicycle", "mscoco_hallucinated_words": [["bicycle", "bicycle"]], "mscoco_gt_words": ["handbag", "motorcycle", "person"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "According to the picture, there is a man in the middle of a crowded stadium, sitting and eating a food item, likely a sandwich", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 460347, "caption": "The image captures a roadway featuring a city bus and multiple cars driving in different directions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 398753, "caption": " It is a bright, sunny day on the baseball field as people gather to watch the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 67833, "caption": "The image showcases a dining table with a large number of items placed across it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "bottle", "knife", "wine glass", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1111111111111111}}, {"image_id": 272880, "caption": "The image depicts a table with a plate of pizza on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 254368, "caption": "According to the picture, there is a man sitting in bed eating something, and a woman is laying beside him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 193108, "caption": " A baseball game is underway as a batter is holding a baseball bat during an exciting moment in the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 459141, "caption": "According to the picture, there is a person wearing a hat while riding a bicycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 231534, "caption": "The image captures an airport scene with various airplanes and transport vehicles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 227031, "caption": "In the image, a man and a woman are standing in front of a white cake, presumably being cut into for a party", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "tie", "cake", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 209347, "caption": "In the image, a woman is sitting on a bench inside a subway car and looking at her cell phone", "mscoco_hallucinated_words": [["bench", "bench"], ["car", "car"]], "mscoco_gt_words": ["cell phone", "train", "tie", "handbag", "person"], "hallucination_idxs": [10, 14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.4}}, {"image_id": 523292, "caption": " The scene features a cat sitting on top of a laptop, which is placed on a table in a living room setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cat", "chair", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 12375, "caption": "The image displays a plate full of food, including a variety of meats such as ham and a meatball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 13550, "caption": " In the image, a woman is crouching down next to a large gray elephant, who appears to be the focus of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 146837, "caption": "In the image, a person is in motion while riding a skateboard on the sidewalk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 67042, "caption": " In the image, a man is standing in a narrow hallway, looking at his cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 209925, "caption": "The image captures a baseball game happening on a field, with a baseball player on the mound and a crowd of people surrounding him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 2154, "caption": " There is a shopping cart sitting on the sidewalk near a parked car, close to a pedestrian path near a street corner", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "car", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 274931, "caption": "The image depicts a row of parked cars next to a building, which could be a street or a sidewalk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 104326, "caption": "The image portrays a clean and green kitchen, accompanied by a dining area, inside a large room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "oven", "chair", "clock", "sink", "knife", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 233888, "caption": "According to the picture, a young boy is playing baseball, holding a bat and standing in front of a large flat-screen television displaying a live baseball game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "baseball bat", "person", "baseball glove", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 213905, "caption": "The scene is a tennis court where two women are standing on opposite sides of the net, ready to play", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "backpack", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 277479, "caption": "In this image, a small child is standing near an open refrigerator", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 300784, "caption": "The image depicts a group of kids sitting and talking together on a couch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 183766, "caption": "The image features an assortment of cakes decorated with various fruits and berries", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "cake", "knife", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 169169, "caption": " The image captures a city street, with a sidewalk bustling with people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "potted plant", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 409346, "caption": " The scene is a social gathering with several people in attendance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 522262, "caption": "A long stretch of sidewalk or a street is lined with multiple bicycles, locked to the railing with a bracket attached", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "According to the picture, a man is standing in front of a mirror, holding a lemon under his chin", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 344942, "caption": " The image features a computer screen with a large keyboard on top, and a single chair near the desk", "mscoco_hallucinated_words": [["keyboard", "keyboard"], ["chair", "chair"], ["desk", "dining table"]], "mscoco_gt_words": ["clock", "laptop", "tv"], "hallucination_idxs": [9, 16, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.75, "Recall": 0.3333333333333333}}, {"image_id": 275929, "caption": "The image features several white toilets sitting on various steps, both above and below a staircase", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": "According to the picture, a group of people with umbrellas is walking in the rain outside a large house", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 300124, "caption": "The image features a couch placed on the sidewalk outside a house", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "couch", "dining table", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 46919, "caption": "According to the image, a person in a snowshoeing trip is traveling up a snow-covered slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 434022, "caption": "There is an image of a train travelling down a train track in the picture, with a gray color", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 490491, "caption": "The image shows a road intersection with a sidewalk, streetlight, and a sign post in the foreground", "mscoco_hallucinated_words": [["streetlight", "traffic light"]], "mscoco_gt_words": ["stop sign", "car", "person"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 175878, "caption": "According to the picture, a group of four people is standing together in what appears to be an outdoor space, such as a patio or balcony", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 12669, "caption": "According to the image, several people are standing in a room or space, possibly at an art show or exhibit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "vase", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 192496, "caption": "The image depicts two trains, both of them on a train track", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 133146, "caption": " It is a scene of a spacious living room with comfortable seating, a fireplace, and a bookcase", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "chair", "couch", "book", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 53744, "caption": "The image depicts a cutting board filled with different types of vegetables and meat, with an assortment of sliced tomatoes arranged around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "dining table", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 375902, "caption": "In the scene, there is a person on skis who is holding a sign with an immense amount of snow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498747, "caption": "According to the picture, there are two people in the scene, a man and a woman", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bottle", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 52435, "caption": "In the image, a group of people are enjoying a day at the beach, with some standing or sitting along the shoreline and others in the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "bird", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301977, "caption": "The image depicts a cow standing near a produce stand or market", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 261097, "caption": " The image features a tennis court where a tennis player, likely the focal point of the scene, is walking down the court with his tennis racket", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227204, "caption": "The image shows three women sitting around a table at a kitchen dinette, each talking on their cell phones", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "banana", "spoon", "bottle", "knife", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 353981, "caption": "The image is an old photo of an airplane parked on an airfield", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 185327, "caption": " In this image, a herd of animals is walking down the street across from a car and bus, with several people also in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "horse", "car", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 348654, "caption": "There is a cell phone placed on top of a speaker in an entertainment system, such as a TV or a computer monitor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "laptop", "tv", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 482432, "caption": "The image displays a close-up view of a sink with two toothbrushes, one being a child's toothbrush, on the right side", "mscoco_hallucinated_words": [["child", "person"]], "mscoco_gt_words": ["bowl", "toothbrush", "sink"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 454161, "caption": " The image features a piece of pizza sliced and placed on top of a small, white plate", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "fork", "dining table", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 144723, "caption": " The image shows a dog leaping into the air while catching a red frisbee in its mouth", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "dog", "frisbee", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "According to the picture, it is an image of a person holding a cordless telephone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 379842, "caption": " The image depicts two Nintendo Wiis, with one on top of the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 203110, "caption": "The image captures a large orange streetcar driving down the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "train", "orange", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 556478, "caption": "In the image, there are two pizzas sitting side-by-side on a tray in the kitchen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "oven", "bottle", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 103815, "caption": "The image captures a baseball game in progress, with a pitcher throwing a ball on the mound and a batter swinging a baseball bat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 451943, "caption": "The image portrays a bedroom with a luxurious bed, featuring a comfortable-looking headboard, pillow and a pair of lamps on the bedside tables", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "dining table", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 268854, "caption": "A group of people, including an older woman and a younger man, are walking around and chatting by the shore", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 34464, "caption": "According to the picture, there are several people enjoying the waves in the beach area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 495513, "caption": "The image depicts a large crowd gathered for a party at night", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 529256, "caption": "The image features two dogs sleeping comfortably on a bed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "In the image, a cat is sitting on top of a television in front of a potted plant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 506401, "caption": "The image captures a scene on a city street with several statues, a small pond, and other figurines", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 406611, "caption": " The image captures a busy ski slope with people of various ages walking and standing in groups, ready to start skiing or snowboarding", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "In the image, there is a white truck parked next to a smaller vehicle, possibly a pickup truck", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "car", "person", "truck", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 278365, "caption": "According to the picture, there are two people sitting at a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 69757, "caption": " The image depicts a group of people sitting around a dining table, enjoying a meal together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "cake", "knife", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 432213, "caption": " The image features a meal consisting of a sandwich and a couple of French fries on a plate, surrounded by a variety of side dishes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "sandwich", "wine glass", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 368367, "caption": "In the image, a woman is talking on a cell phone, covering part of her face with the handset", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "In the image, there is a section of dirt on a highway next to a sign", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 92131, "caption": "In the image, a green and white public bus is parked in front of a large building, with people in the vicinity of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": "The image features a woman lying down on the floor, likely taking a break or resting after a busy day", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 565148, "caption": " This image captures a baseball game taking place on a field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 160183, "caption": "The scene features a red and white fire truck parked in a large parking lot", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 555456, "caption": "The image features snow skiers in the snow, with one person skiing down a slope and several others around the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 235595, "caption": " The image showcases several motorcycles parked next to each other on the street, creating a unique sight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "potted plant", "car", "parking meter", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 489909, "caption": "The image features a basket full of fruits, including several oranges and bananas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "orange", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 501080, "caption": "According to the picture, there is a large, beautiful arrangement of flowers, with a mix of pinks and greens", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 405183, "caption": "According to the picture, a woman is standing in a living room holding a remote control for a Nintendo Wii video game, while a man is seated nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "potted plant", "chair", "couch", "book", "handbag", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 409138, "caption": "The image features a large, white bus parked near a sidewalk near a building with several other buses in the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411840, "caption": "The image depicts two women tennis players walking across a tennis court together during an event", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 333712, "caption": "The image features a cheese and spinach pizza, partially consumed and with some slices missing from the dish", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "spoon", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 148977, "caption": "The image features a teddy bear wearing headphones on its ear, sitting on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "bottle", "bear", "keyboard", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 399058, "caption": "The image features an elephant walking down the street with several people standing around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "orange", "person", "truck", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 183571, "caption": "According to the picture, there is a man standing on the boat with a dog", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 325836, "caption": "There is a showcase of various motorcycles at a convention with people walking around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437910, "caption": "The image features a small bathroom with two toilets side by side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 155885, "caption": "This image shows a busy harbour scene with many boats of different sizes scattered around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 467887, "caption": "A man is sitting at a table, working on his laptop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "couch", "mouse", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 174402, "caption": " The image features a man standing on a tennis court, holding a tennis racquet and ready to play the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 352734, "caption": " The image depicts a young boy eating ice cream at a dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 346716, "caption": "There are two double-decker buses driving down a city street, surrounded by other vehicles and people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451144, "caption": " The image captures two people standing on a snow-covered slope, looking at skis in the mountains", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295656, "caption": "According to the picture, the main focus is on three people, one woman and two men, standing next to each other and posing in a group", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "tie", "clock", "car", "person", "pizza", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 129886, "caption": "In the image, there is a ski slope, possibly at a resort, with two main groups of people visible, both of which appear to be in the middle of skiing activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557998, "caption": "According to the picture, a young man is sitting at a wooden table or bench, looking at a glass of wine", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 401010, "caption": "In the image, there is a bedroom with a bed situated in the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "sink", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 567562, "caption": "The image depicts a woman sitting at a dining table surrounded by four children, including two young girls and two boys", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "book", "broccoli", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.18181818181818182}}, {"image_id": 313928, "caption": "The image depicts a balcony overlooking the ocean with a table, chairs, and a surfboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "dining table", "chair", "bottle", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 490284, "caption": " The image shows a dog, possibly a black and brown breed, lying on top of a person's lap on the couch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 346940, "caption": " The scene features a stove with various cooking utensils and kitchenware", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "knife", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "This is an image of a vintage sign in black and white", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 255934, "caption": " The image showcases two elephants standing close to each other in a large enclosure, possibly a zoo or a park", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "elephant", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 278627, "caption": "The image is a collage of pictures featuring food items", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "potted plant", "spoon", "chair", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 400851, "caption": "A large group of people is seen in the image standing on the beach, enjoying their day and making use of various seating areas, such as benches and lawn chairs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "boat", "chair", "sports ball", "umbrella", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 472610, "caption": "The image shows a person, likely a woman, standing outside with her dog on a leash", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 78565, "caption": " The image portrays a group of people gathered on the beach near some small sailboats", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": "The scene features a young person riding a skateboard in a parking lot, surrounded by people at various locations", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "chair", "bottle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 289640, "caption": "In the image, a man holding an orange frisbee over his head while another person stands nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "wine glass", "orange", "person", "cup", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 122602, "caption": "There is a variety of craft supplies and tools placed on a wooden table in this image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "bottle", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 24104, "caption": " The image portrays a typical office desk with a multi-monitor setup, a single computer, and various office items placed on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bed", "mouse", "keyboard", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 183709, "caption": "The image depicts a group of people standing on the sidewalk, in front of an intersection where a crosswalk and two traffic lights are located", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 59710, "caption": "The image depicts a black and white refrigerator in a bedroom, likely situated near the bed", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["chair", "dining table", "refrigerator"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": "The image captures a little league baseball game with multiple players, including a young player catching a ball and another player in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 314729, "caption": "The image is a baseball card, likely dating back to the early 20th century, featuring a baseball player holding a bat and wearing an old-fashioned uniform", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 527497, "caption": "According to the image, there are two computer monitors placed on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 411564, "caption": " The image shows a man sitting on a windowsill in a kitchen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "bottle", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 320350, "caption": "The image features a man and a woman, both wearing skis, standing on a snowy plain with two dogs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 401857, "caption": " There is a baseball game happening in a baseball field, with numerous players and baseball equipment spread throughout the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "bench", "person", "baseball glove", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 285302, "caption": " The image depicts a young boy sitting at a dining table and cutting paper with scissors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "scissors", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 61959, "caption": "The image features a large white bus driving down the street in an urban area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 229659, "caption": " In the image, there is a large open space filled with chairs, some of which are at tables", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "clock", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 473118, "caption": " The image shows a person riding a skateboard on top of a half-pipe or a ramp, skillfully balancing on a skateboard ramp", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "The image depicts two people standing on skis in the snow, one of them wearing blue and the other wearing red", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 416104, "caption": "According to the picture, there is a group of people seated at outdoor tables under multiple blue umbrellas, creating a relaxed atmosphere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 511852, "caption": "The image shows two people skiing down a snow-covered slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 59386, "caption": " The image features a group of giraffes standing in a field, likely eating grass", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "A picture captures a busy city street scene with traffic lights mounted on a pole", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 153692, "caption": "According to the image, there is a man riding a bicycle and crossing the street with his dog", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "traffic light", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 265628, "caption": "The image showcases a unique public restroom facility, featuring a toilet and sink arranged side-by-side", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["bowl", "toilet", "person"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 499594, "caption": " The image features a meal consisting of various food items placed on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "bottle", "knife", "broccoli", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 5934, "caption": "According to the picture, there is a baseball and a baseball glove sitting in a dining bench, likely on a sports field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47828, "caption": "According to the image, it is night time and there is a large river filled with water, possibly a canal, near several bridges", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 47916, "caption": " There are several dogs, including three main dogs, running around a grassy field in the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "car", "truck", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 255483, "caption": "The image depicts a person sitting at a table, surrounded by several books and papers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "dining table", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 131138, "caption": "A well-set office desk is showcasing various computer parts, including a laptop and a monitor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "spoon", "mouse", "keyboard", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 258209, "caption": " The image depicts a man sitting on a bench in front of a large building, possibly a brown building or a building with a brown color", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bench", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 347453, "caption": "In this scene, there are two red double-decker buses, one parked and the other moving down the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bench", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 285820, "caption": "The image shows a living room filled with furniture, including a couch in the center of the room and another smaller couch along the wall", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "couch", "book", "bench", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 245664, "caption": "The image features a table with a laptop sitting on it, which is on and connected to a monitor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "wine glass", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 453731, "caption": "According to the image, there is a dog sleeping on the floor next to a wooden bench or counter", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["bottle", "dog", "cup"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 524601, "caption": "In the image, there is a living room setting with a group of five people standing together, playing a video game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "chair", "couch", "book", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 253262, "caption": " The image shows several people standing around an airplane, which appears to be parked at an airport or airfield", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 87052, "caption": " The image features a couple standing in a kitchen, possibly getting ready to eat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "vase", "oven", "bottle", "person", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 357578, "caption": "There is a red fire truck parked in front of a red car on the street, with several other vehicles present including a blue car, a black truck, and a green truck", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 418692, "caption": " The image depicts a woman sitting in a living room on a couch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 259345, "caption": "According to the picture, a man is sitting on a bench while holding an umbrella", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["chair", "person", "umbrella"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 119709, "caption": " The image depicts a woman standing in a kitchen, focused on a task in the vicinity of a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 443299, "caption": " The image features a man and a woman sitting on a bench, possibly waiting for something or someone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 120776, "caption": "In the image, there are several outdoor umbrellas, each with their unique design and colors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411765, "caption": "In the image, a man is playing a game of tennis on a tennis court, holding a tennis racket", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 447991, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bicycle", "handbag", "traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 276719, "caption": " The scene takes place in a city street with multiple cars parked on both sides of the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "truck", "chair", "handbag", "dog", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 422328, "caption": "In the image, a horse is tied to a snow plow, making it an unusual sight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "horse", "skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 354559, "caption": " The image features a young woman wearing a black and white striped dress, standing against a wall and posing with a stuffed animal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "bear", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 438788, "caption": "The image depicts a dining table with a slice of cake placed on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "knife", "person", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 468005, "caption": " The image shows a large elephant with tusks, walking down a path", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 545594, "caption": "According to the picture, a group of people is sitting on a bus as they go about their daily activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "orange", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 219546, "caption": "The image depicts a table filled with various foods and a large number of bowls arranged around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 386645, "caption": " The image captures a street scene with an old looking building, some cars, and a small truck parked in front of the building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 155131, "caption": "The image features a woman dressed in white performing a serve in a tennis match", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "sports ball", "bench", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 188752, "caption": " In the image, there are several hanging bunches of bananas arranged vertically from top to bottom, creating an appealing visual display", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 228350, "caption": "According to the picture, there is a large group of people sitting outside of a restaurant, with multiple tables and chairs set up in front of red umbrellas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "chair", "tie", "wine glass", "umbrella", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437720, "caption": "The image is a painting that depicts a nude woman sitting at a table while working on a computer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "chair", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 378831, "caption": "A woman is walking down the street, carrying grocery bags, and wearing a backpack", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["handbag", "fire hydrant", "person"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 375503, "caption": "The image shows a stairwell leading to a residence", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "clock", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 330369, "caption": "According to the picture, a large red and white boat is traveling on the water, occupying a significant portion of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 288576, "caption": " According to the picture, a man in his 40s is playing frisbee with his son outside in a field filled with grass", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 32190, "caption": "The image features a toy horse on the sidewalk next to a street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 535403, "caption": "The image displays a small, tiled bathroom with white and blue vanities and mirrors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "clock", "bottle", "sink", "hair drier", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 449798, "caption": "The image features a desk or table topped with various items", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 375769, "caption": "In the image, a young boy wearing a helmet is sitting at a table in front of a cafe with several other people in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bicycle", "chair", "hot dog", "umbrella", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 426172, "caption": "A photo display stands with a bunch of signs in front of it creates an eye-catching setup", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 20650, "caption": " The image features a plate with various food items, including a delicious sandwich and a side of vegetables, specifically broccoli", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "sandwich", "orange", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 138078, "caption": "In the image, there is a baseball field where two baseball players are standing in the dirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 152499, "caption": "According to the image, a group of people and kids are enjoying a party by a pool", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "dining table", "potted plant", "chair", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 180764, "caption": "According to the picture, a man in glasses is biting a pink glazed donut, and another person is visible in the background, likely standing or sitting nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "microwave", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 147762, "caption": "The image features a small white plate, sitting on a table, adorned with a piece of cake, ice cream, and a lemon on top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "fork", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 113860, "caption": "The image features a canal in which a boat is moving from the back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 460866, "caption": "The image shows a cup filled with multiple toothbrushes of various sizes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "toothbrush", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177015, "caption": " The image captures a man sitting on a couch, holding a cat on his lap as he uses a laptop computer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "chair", "couch", "person", "apple", "laptop", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 333998, "caption": "A family of four is preparing meals in a small kitchen filled with wooden cabinets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "microwave", "person", "suitcase", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 47131, "caption": "The image shows a black and white photo of a train that has derailed and fallen off the rails", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 425447, "caption": "The scene features a white pickup truck parked on the side of the street, sitting in the middle of the roadway", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 295105, "caption": "In the image, a man is standing inside a kitchen, looking out of a refrigerator toward a microwave located on the left side of the kitchen", "mscoco_hallucinated_words": [["microwave", "microwave"]], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "person", "apple", "refrigerator"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2857142857142857}}, {"image_id": 443259, "caption": "This image showcases a modern and minimalist kitchen equipped with all stainless steel appliances and surrounded by oak wood flooring", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "oven", "chair", "bottle", "sink", "orange", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 537861, "caption": "Scene) and a person walking on the sidewalk nearby, with a small group standing to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 145020, "caption": "There is an image of a disneyland, likely donald duck, in the center of the scene, with a bunch of toys on the left side and a few more to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "mouse", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 249969, "caption": "The image showcases a plate filled with various types of meat, vegetables, and potatoes, all arranged beautifully and artistically", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 146504, "caption": " The image shows a person sitting in front of a keyboard and mouse, with his hand on the mouse", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 40037, "caption": "There is an image of a large building with a clock tower situated on the top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 343218, "caption": " The image shows a tennis court where two men are playing tennis", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "car", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301837, "caption": "The image features a long, narrow kitchen with white appliances and a sink located towards the back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "clock", "sink", "apple", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 309071, "caption": " In the image, an old man is standing next to a bicycle that is leaning against a fence", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "potted plant", "bicycle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 240681, "caption": "The scene is set on a street with a sidewalk, and a man is standing near his red motorcycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 178753, "caption": "The image shows a young girl, possibly a teenager, sitting in a chair with a cell phone in her hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 278890, "caption": "In the image, a man is placing a cell phone in his pocket while wearing a blue shirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47781, "caption": "There is an image of a bedroom that is very modern in style", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "bed", "book", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 542792, "caption": "The image shows a city street scene with a large baseball bat sticking out from the side of a building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": " The image portrays a group of three men sitting at a dining table in a restaurant, smiling as they enjoy their meal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 318777, "caption": " The scene takes place in a large sports stadium with several baseball players on the field during a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 14773, "caption": " The image features a table topped with a piece of food resembling a car, with hot dogs on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "hot dog", "bottle", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 521863, "caption": "According to the picture, a person on a skateboard is skating in a public area where there are people all around him, walking and socializing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 250540, "caption": " In the scene, there are five people riding three motorcycles down a street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "motorcycle", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 211604, "caption": "According to the picture, there is a female tennis player lying on the floor, resting after play", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 298067, "caption": "A plate topped with several pieces of food is next to a bottle, creating a combination of a meal with a beer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "dining table", "bowl", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 563938, "caption": "According to the image, there are three people sitting on a couch in a living room-style space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "couch", "bottle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 461311, "caption": " The image features a large field filled with people enjoying themselves during the day", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "kite", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 47940, "caption": "The image displays a person sitting on a bed, surrounded by various books, including three on the bed and one on the floor next to them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "laptop", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 261318, "caption": "In the scene, a man is sitting on a chair while talking on his cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "handbag", "bench", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 134768, "caption": "The image depicts a combination of a keyboard and speakers, which could be considered a set-up for a computer or sound system", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["mouse", "laptop", "keyboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 526414, "caption": "A woman and a cat are shown working in a sewing workshop, which appears to be situated in the living room of a house", "mscoco_hallucinated_words": [["woman", "person"]], "mscoco_gt_words": ["scissors", "bowl", "dining table", "cat", "remote", "couch", "book", "laptop", "tv", "cup"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.1}}, {"image_id": 273132, "caption": " The image features an old woman sitting on a park bench, likely in a park or a public area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": " The scene depicts a man wearing a jacket, sitting outside near a bench, surrounded by a few buildings in the background", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["hot dog", "sandwich", "person"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 192656, "caption": "The image depicts a baseball field with several people standing in various positions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 272728, "caption": "The image features a vase filled with various kinds of flowers, creating a visually appealing arrangement", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 509811, "caption": " The image depicts a large, open room filled with numerous tables, all with multiple laptops placed on them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "book", "apple", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 412407, "caption": "According to the picture, there are multiple people in the scene, each one holding a cell phone in their hands", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": "The scene takes place on a wet and chilly day as a woman is walking down the sidewalk under a large, colorful umbrella", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "suitcase", "handbag", "umbrella", "person", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441363, "caption": "The image depicts a tennis player on a tennis court, leaping up in the air while striking the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 331084, "caption": " In the image, there is a dining table laden with various pizzas, several onions, and a knife", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "spoon", "knife", "person", "pizza", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 282553, "caption": "According to the picture, a dirt road leads to a hill, with a couple of people walking along the trail at dusk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 328818, "caption": " In the image, a woman is leaning on a park bench and putting on her shoes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bench", "bottle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 3103, "caption": "In the image, a man rides his skateboard on top of a large wooden ramp, appearing to be in the middle of his trick", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 188136, "caption": "This image features a spacious kitchen area with a table, two sinks, and several metal buckets of various sizes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "sink", "orange", "person", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 449675, "caption": "According to the image, there is a white plate topped with a sandwich, sitting on a table in a dining area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "bottle", "sandwich", "knife", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 191691, "caption": "According to the picture, a man is shaving his face in the bathroom while standing in front of a sink", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["bottle", "toothbrush", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 89378, "caption": " The image depicts a man standing next to a motorcycle with a large building behind him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "backpack", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 99874, "caption": " In the image, a woman with sunglasses on is sitting in a dining area or restaurant, holding a cell phone to her ear", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "cat", "bottle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 437895, "caption": "The image features a colorful blanket on a bed, giving it a cozy and cheerful look", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 557447, "caption": " The image shows a man in a business setting sitting down at a table and placing his hand on a document", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "tie", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 159979, "caption": " In the image, there is a group of people gathered around a row of small boats floating on the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bowl", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 357, "caption": " A professional baseball game is taking place on a field in the middle of an intense competition", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 538891, "caption": "The image features a woman standing on a tennis court, with a tennis racket in her hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 561967, "caption": " Sighting a train on a railway track, it has multiple wagons and a colorful combination of orange, blue, and black paint on the cars", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["train", "traffic light", "car"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "In the scene, a blue train is seen on the train tracks coming towards the viewer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 7125, "caption": " The image features a person riding a bicycle on a paved bike path with a couple of other bicycles nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "bottle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 221350, "caption": " In the image, an older man is holding a red tie and appears to be adjusting it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "tie", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 280930, "caption": " A young girl, possibly around six years old, is standing in a kitchen, holding a tray of food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 151081, "caption": "The image depicts an open field with a large cloud of smoke hanging overhead", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 122232, "caption": "In a tennis court setting, a person is standing and holding a tennis racket, possibly playing the sport", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 134223, "caption": "The image features a hot dog and fries on a plate, which is surrounded by several condiments and dipping sauces", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "hot dog", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 198163, "caption": " In the image, there is a man sitting in front of a display of numerous cups filled with various colors of paint", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["bowl", "dining table", "person"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 3742, "caption": "In the image, there is a vase filled with multiple apples arranged in a decorative way on the surface", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "apple", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 217593, "caption": "According to the picture, there are multiple people, possibly ball players, gathered in a sand pit area", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["baseball bat", "chair", "handbag", "person", "baseball glove"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2}}, {"image_id": 279078, "caption": "The image depicts a young boy standing in front of an open refrigerator filled with numerous bottles of various types and sizes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": " The image captures a tennis tournament taking place on a blue court", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "couch", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 477016, "caption": "In the image, there is a room with two women and a young girl standing in it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "potted plant", "oven", "sink", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 301266, "caption": " The image shows a group of people, likely a family or a group of friends, gathered around a kitchen counter in a store", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "sink", "book", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 475813, "caption": "The image features a young child in a room, dressed in an outfit with a top and bottom", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "remote", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 558784, "caption": "According to the picture, there is a man standing near a river, holding a baseball bat", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["backpack", "person", "frisbee"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 308543, "caption": " In the image, a person is holding two silver spoons in their hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "sink", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 359164, "caption": " In the image, there are several small dogs playing in a grassy area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "dog", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "The image showcases a lego kitchen with checkered flooring", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "clock", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 143479, "caption": " The scene depicts a large gathering of people, possibly attending an outdoor party or event", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 475024, "caption": "The image depicts a vase placed on a wooden surface under a mirror", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 238065, "caption": "The image shows a young man riding on a skateboard down a ramp while performing tricks in the air", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "According to the picture, there is a bathroom sink with toilet paper on a shelf above it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 322163, "caption": " The image depicts a man in a large kitchen, actively preparing food in the middle of the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "remote", "oven", "bottle", "person", "pizza", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1111111111111111}}, {"image_id": 230983, "caption": "The image features a person on a skateboard, captured in mid-air while jumping over an object", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "According to the image, there is a kitchen area that has wooden cabinets with different sizes throughout", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "refrigerator", "sink", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 53431, "caption": "In the image, a man is sitting outside a building, possibly waiting for someone or enjoying the day", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "laptop", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441840, "caption": "The image captures a typical baseball game, featuring a young boy in a baseball uniform who is swinging at a baseball, held in his hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "baseball glove", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 53465, "caption": " The image features a large sheet cake decorated with pink frosting that is prominently displayed on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 381031, "caption": " An image portrays a food scene laid out on a table top, containing a variety of food items", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "donut", "spoon", "bottle", "microwave", "apple", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 530520, "caption": " In the image, a group of four men, including two seated and two standing, sit outside on the grass, relaxing and enjoying their time together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "clock", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 539555, "caption": "According to the picture, a man in the center is catching a frisbee and performing a trick while holding it in his hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 279521, "caption": " In the image, there are two people standing near a public transit train", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "train", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 560439, "caption": " The image captures a snowy winter scene where a group of three people, all wearing snowboards, are traveling down a snow-covered hill", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "backpack", "skis", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 248353, "caption": " The scene is set at a ski slope where people are enjoying their skiing activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 9628, "caption": " The image depicts a person, possibly a man, riding a water ski behind a boat", "mscoco_hallucinated_words": [["ski", "skis"]], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 330050, "caption": "According to the picture, a man and woman are standing next to each other on a tennis court", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 254161, "caption": " In this scene, a woman is flying a large kite outdoors, possibly in a city park", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "kite", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 275749, "caption": "According to the picture, the scene involves a group of people gathered in a room, likely sitting on a couch or chairs, near several beverage bottles and a TV monitor", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "mouse", "person", "laptop", "tv", "cup"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 163518, "caption": " The image depicts a woman working in a kitchen, standing in front of a table filled with assorted salads", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 156696, "caption": "The image features a large train at a train station, positioned to the left of the platform", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 525202, "caption": "The image features a pizza placed on top of a red and white tablecloth, likely in a restaurant or dining area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1111111111111111}}, {"image_id": 423984, "caption": " The image features a plate of food topped with carrots, broccoli, and bread", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 499486, "caption": "The scene features two cats sitting on top of a unmade bed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": "The image features a man wearing glasses, a blue tie, and a plaid shirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 288729, "caption": " The image features a large cake that resembles a circus tent", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cake", "bear", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 177721, "caption": " In the image, a person is performing a trick on a skateboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": " The image captures a man with gray hair and a beard wearing a black and white suit, black hat, and a tie", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["handbag", "cell phone", "horse", "person"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 252625, "caption": "This is a photo capturing a small street or alley lined with many shops on the right side and a sidewalk on the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 493610, "caption": "The scene features a large truck or van with a flat top, occupied by a group of people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 302789, "caption": "A small room is depicted with a bed sitting against the wall", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bed", "bottle", "sink", "handbag", "suitcase", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 30667, "caption": "According to the picture, there are two people sitting in the green booth, with a dog occupying one of the seating areas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 114108, "caption": " The image features several people seated around a table, some of them focused intently on the two slices of pizza placed on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 328110, "caption": "According to the picture, there is a woman sitting on top of a park bench with a baby in her arms", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 366111, "caption": " This image appears to be a vintage or black and white photo featuring several people riding bikes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 532481, "caption": "The image features people enjoying a day on the water, with a man being pulled by a parasail in the middle of the ocean", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 291634, "caption": "The scene is a sidewalk with a row of motorcycles parked in a row next to the curb", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 463678, "caption": "The image shows a man on a tennis court swinging his tennis racket in preparation to return a serve, which is the main focus of the picture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 70815, "caption": " There is a dog sitting on the sidewalk near a bicycle, which is the main object in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "dog", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 367872, "caption": " The scene captures a moment of excitement during a baseball game as a batter swings at a ball on the field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "umbrella", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 353898, "caption": "The scene shows a person sitting on a cement walkway surrounded by a large group of birds", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "bench", "person", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 88269, "caption": "The image displays a plate with a couple of sandwiches and a bowl of tomato soup next to them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bowl", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 463211, "caption": "There is a close-up view of a young girl in a backpack walking in front of a school bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "In a large and ornate room, there is a vase holding a bouquet of flowers and several chairs surrounding a circular table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 98979, "caption": "The image shows a silver microwave oven sitting on a countertop, placed in the center of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "knife", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 244455, "caption": " The image features two motorcycles riding on a street, with the riders wearing protective gear such as helmets, vests, and gloves", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": " According to the picture, it is a close-up of a black material, with a purple plastic cutting shears held in a pair of scissors close to the material", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "dining table", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 536154, "caption": "According to the image, there is a small child sitting on a couch or chair amidst a large pile of stuffed animals", "mscoco_hallucinated_words": [["couch", "couch"], ["chair", "chair"]], "mscoco_gt_words": ["teddy bear", "cat", "person"], "hallucination_idxs": [13, 15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 374061, "caption": "The image features a black cat sleeping and resting with its head against a stuffed animal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cat", "bed", "couch", "bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 560018, "caption": "The image captures a lively ocean scene with a group of people enjoying water sports, such as surfing, in the waves", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 353320, "caption": " The image captures a guitar, placed on the ground on top of a bench, as well as a backpack and two handbags lying nearby", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["handbag", "bench", "suitcase", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 256628, "caption": " In the image, a large, beautiful golden-colored dog is laying on the wooden floor of a patio, possibly enjoying some rest", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": " The image features a person outside, likely in a backyard, with a large dog by their side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sandwich", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 424270, "caption": " The scene features a little girl sitting on a bed in the middle of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": "The scene features a large parking lot filled with multiple cars", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 483227, "caption": " There is a group of people standing on a tennis court in the image, including at least nine people of various ages", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 228306, "caption": "The image features a red bus traveling down a street near the water, possibly in a city", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 416384, "caption": "According to the picture, there is a woman sitting in a chair and using a cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 364783, "caption": "The image is a picture of a red bathroom with a toilet, sink, and a tub or shower", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "chair", "bottle", "toothbrush", "sink", "toilet", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 335041, "caption": " The image features a woman with skis standing on a snow-filled street, skiing past multiple cars parked alongside it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 531327, "caption": "The image features a white bowl placed on a dining table that is filled with a variety of mixed vegetables, consisting of broccoli, carrots, and other colored vegetables", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot"], "hallucination_idxs": [5], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.42857142857142855}}, {"image_id": 451228, "caption": "The image features a busy street lined with holiday lights and decorations", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 256365, "caption": " The image features a large plate covered in various blue- and white-frosted cupcakes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 502936, "caption": "The scene is set at a tennis court in a large outdoor area, likely a park or a public recreational space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 451449, "caption": "According to the picture, there is a large dog lying in a dog bed, taking up most of the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 51054, "caption": " The image features an elderly woman sitting on a bed in her bedroom", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bed", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 1268, "caption": "According to the picture, there is a woman standing near the water, possibly taking a photograph or checking her phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "boat", "handbag", "person", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 62692, "caption": "In the image, a woman is playing tennis on a sports court", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 542771, "caption": "The image depicts a spacious room filled with a large array of chairs, dining tables, and a vase", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant", "chair", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 575406, "caption": " In the image, a red bus with a blue top and a white roof is driving along a street next to several other parked vehicles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 244834, "caption": "The scene features a group of people walking down a rainy street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "bicycle", "clock", "umbrella", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 151159, "caption": " There are several people present in the image, with some scattered throughout the scene and others grouped around skateboards", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277073, "caption": "The scene takes place on a street with multiple vehicles moving in different directions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "bicycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 377879, "caption": "The image features two military tanks, sitting on a large open area, likely a parking lot or a playground", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bed", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 436814, "caption": "The image displays a room with various types of technology set up in a small area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "mouse", "laptop", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 63934, "caption": "The scene features a person on a skateboard, dressed in black, navigating their way down a sidewalk in a suburban area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 275611, "caption": " The image features a small pizza sitting on top of a plate on a dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 516248, "caption": "In the image, a person is sitting at a dining table or desk, placing their hands near a computer keyboard and a mouse", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 478380, "caption": "The image depicts a person sitting in a van surrounded by a large flock of sheep", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 422326, "caption": "The image depicts a parking lot with a variety of motorcycles parked along the side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 110449, "caption": " The image shows two people standing behind a counter, each holding a remote", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 45550, "caption": " In the image, there is a man standing in a room filled with other people, taking a selfie", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "bowl", "sandwich", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 444913, "caption": "According to the picture, there is a man standing in a grassy area, possibly near some buildings, holding a bottle", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["car", "person", "frisbee"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 82709, "caption": "The image features a large field filled with a number of people scattered around, some seated, others standing or walking", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "frisbee", "bottle", "dog", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 132796, "caption": "In the image, a group of three people are riding on the back of an elephant, enjoying their time together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bench", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 303099, "caption": "According to the picture, there are two cats sitting on a toilet in the bathroom", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "According to the image, a group of people are riding motorcycles down a paved street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 205193, "caption": " In the image, there are two bowls on a kitchen counter next to each other", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["oven", "microwave", "person", "toaster"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 272566, "caption": " The image shows a man sitting on the ground in front of a produce market", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "person", "apple", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 170099, "caption": " The image features a man standing in front of an orange couch, with his hands out and open, as if he is making a speech or presentation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "orange", "couch", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 14940, "caption": "According to the picture, there is an orange and white cat sitting next to a stuffed animal or toy, perhaps hugging it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "chair", "couch", "orange", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 408449, "caption": "According to the picture, several people are present in the scene, with one man riding a skateboard and another walking behind him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "handbag", "skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 140702, "caption": " The scene features two elephants, an adult and a baby, walking together on an open grassy field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 354540, "caption": "The image shows a person, likely a woman, sitting at a kitchen countertop with a laptop and a smartphone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "oven", "chair", "person", "toaster", "laptop", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 19763, "caption": " The image showcases a piece of pizza placed on a white plate on a dining table, accompanied by a fork", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 191301, "caption": "The image features a small, white tray containing two pieces of food \u2013 one dish, possibly consisting of chocolate cake, and the other a square piece of cake, perhaps vanilla", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 124236, "caption": " The image showcases a kitchen filled with various items, including a toaster oven sitting on the counter", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 344930, "caption": "According to the picture, there is a red fire hydrant in the scene on the sidewalk, which is located at the edge of a residential street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "car", "fire hydrant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 14285, "caption": "In the image, a large, fluffy cat is laying on a bed, resting comfortably in a room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "cat", "bed", "chair", "book", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 82488, "caption": "There is a hotel room or hotel bedroom setting with two twin beds in it, as indicated by the furniture, with a desk or nightstand on the left and another one on the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "bed", "clock", "book", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 348251, "caption": "The image captures a man standing on top of a snow-covered slope, wearing skis and enjoying the winter scenery", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 150703, "caption": "The image features a sandwich made with a hot dog and topped with various toppings, such as pickles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "dining table", "sandwich", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 381615, "caption": "The image showcases a warm, cozy room with a bright window, where a variety of plants are displayed prominently throughout", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "chair", "book", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 352703, "caption": " The scene features a woman preparing food at a dinner party, possibly in an outdoor setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "bottle", "handbag", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 111109, "caption": " The image features a young boy wearing shorts standing on a chair in a room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "chair", "tie", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": "A group of people, many of whom appear to be tourists, are gathered around a red street near several buildings, with a bus visible in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 49005, "caption": " The scene depicts a group of baseball players on a field during a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 410114, "caption": " The scene is a road or highway with a large herd of cows and a few people walking down it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "horse", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 100274, "caption": "According to the picture, there is a train on some tracks at a rail yard, sitting near other trains on the railways", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 317254, "caption": "In the scene, a person is sitting on the back of a motorcycle, riding down a street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 425569, "caption": " The image showcases a large kitchen featuring a variety of shiny silver cooking equipment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 28842, "caption": "The image features two young men in a park, possibly having fun on their skateboards", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 319607, "caption": " The image captures an intersection scene where there is a traffic light at the top of the frame", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 210372, "caption": "In the image, there is a small kitchen featuring red cupboards and drawers underneath the countertops", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "bottle", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 156915, "caption": " The image features a vase filled with a variety of flowers, including red roses, white flowers, and greenery", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 349642, "caption": "The image shows a man sitting on a wooden bench while a dog is laying underneath it, giving the impression that they are enjoying each other's company", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": " The image depicts a body of water, likely a canal, with a group of small boats lined up near the shore", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "umbrella", "handbag", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 45435, "caption": " The image features a person holding up their cell phone, highlighting its camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": " The image captures a man sitting in front of his desk, using his laptop and a computer screen as he is on his desktop computer working", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 72656, "caption": " The image features a group of children seated at a table outdoors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "chair", "person", "pizza", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 372087, "caption": " The image features a long, green and yellow train traveling down a train track as it approaches a train station", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 336209, "caption": "The image captures a young man in the process of jumping off a skateboard on a ramp, or off a ledge", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 46031, "caption": "The image displays two laptops side by side on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 283118, "caption": "The image features a family sitting at a table in a restaurant or a dining area, consisting of a man, a woman, and their two children", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "dining table", "chair", "bottle", "handbag", "car", "person", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 429598, "caption": "The image depicts a kitchen with stained wood cabinets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "bottle", "refrigerator", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 333365, "caption": "The image shows an airport scene with several planes parked on the tarmac", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 424174, "caption": "The image features a large bowl full of various fruits, including bananas, oranges, and apples", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "banana", "orange", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 3035, "caption": " The image captures a scene at an airport, with two airplanes positioned at different locations on a runway", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 177213, "caption": " The image showcases a pizza placed on a white dish in the center of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 438535, "caption": " The image depicts a city street scene with a prominent clock in the center, surrounded by various buildings in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 490711, "caption": " The image features a white kitchen with clean and modern appliances", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "banana", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 163728, "caption": "According to the picture, there is a gray and white cat sleeping on a keyboard surface, curled up next to an empty glass", "mscoco_hallucinated_words": [["keyboard", "keyboard"]], "mscoco_gt_words": ["dining table", "cat", "mouse", "laptop", "cup"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 456756, "caption": " The image features a group of animals including a giraffe and several zebras", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 281028, "caption": "The image depicts a room with multiple chairs arranged throughout the space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 343937, "caption": " In the snow, a young woman wearing all white clothing is snowboarding down a slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 277051, "caption": " The image showcases two little birds, sitting on a dining table near a pizza slice that's partially eaten", "mscoco_hallucinated_words": [["pizza", "pizza"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "bird"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 145666, "caption": " The image features a large metal pan filled with a variety of cooked broccoli and carrots, ready to be consumed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "dining table", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 304984, "caption": "The image features a white plate topped with two sandwiches", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "cake", "sandwich", "wine glass", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 122467, "caption": "In the image, there is a person holding a video game controller in their right hand, indicating they are playing a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "remote", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 518287, "caption": "According to the image, it features a toothbrush with a mouth full of teeth inside of a holder", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "toothbrush", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 145448, "caption": " In the scene, there is a gray cat laying on top of a dining table near a tire and motorcycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "dining table", "cat", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 352900, "caption": " There is a white plate on the table filled with a pasta dish with pieces of cooked broccoli", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["fork", "bowl", "broccoli", "knife"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 153607, "caption": " The image is a collage of different vases filled with water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "bowl", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 157581, "caption": " There is an image showcasing a table filled with various bottles of wine placed side by side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 227438, "caption": "The image is of a hotel room with a double bed, a television, and a desk", "mscoco_hallucinated_words": [["television", "tv"], ["desk", "dining table"]], "mscoco_gt_words": ["chair", "couch", "clock", "bed"], "hallucination_idxs": [13, 17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.25}}, {"image_id": 116037, "caption": "The image captures a moment during a baseball game, with several people in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 202658, "caption": " In this image, a white toilet with a pink seat is sitting on the ground in a backyard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 18150, "caption": "According to the picture, a man and a little boy are sitting on the floor next to each other, with the boy giving the man a slice of pizza", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "couch", "bottle", "person", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 418711, "caption": "In this image, a person on a bike is plowing through a long dirt road filled with bananas and multiple vehicles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 92107, "caption": "According to the image, there is a bowl filled with soup on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bowl", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 491000, "caption": "According to the image, a group of people is walking down a street, engaging in conversation while carrying various bags", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "handbag", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 401163, "caption": "The image depicts a park, with a couple sitting on a bench near the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 39663, "caption": "The image displays a variety of assorted items including various books, a laptop, and a school backpack laid out on a floor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "scissors", "backpack", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 268293, "caption": "The image features a man standing on a tennis court, holding a tennis racket as he prepares to swing and hit the tennis ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "The image displays a well-equipped kitchen with various appliances such as a microwave, a sink, and a refrigerator", "mscoco_hallucinated_words": [["microwave", "microwave"], ["refrigerator", "refrigerator"]], "mscoco_gt_words": ["vase", "oven", "spoon", "bottle", "clock", "sink", "apple"], "hallucination_idxs": [12, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.14285714285714285}}, {"image_id": 358086, "caption": "The image depicts a group of people playing frisbee in a field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bottle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 89541, "caption": "In the image, there is a plastic food container filled with a variety of different food items", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "cake", "bowl", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 239445, "caption": "According to the picture, the image features a man standing near a car, holding an empty frisbee in one hand and another, full frisbee in the other", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["person", "sports ball", "frisbee"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "According to the picture, a zebra and an airplane are flying in the field, creating an unusual scene", "mscoco_hallucinated_words": [["zebra", "zebra"], ["airplane", "airplane"]], "mscoco_gt_words": ["cat", "kite", "dog", "car"], "hallucination_idxs": [6, 9], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 487990, "caption": "There is an image being displayed, with a small guitar on top of a table full of food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "donut", "spoon", "bottle", "cake", "knife", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1}}, {"image_id": 138834, "caption": "In the picture, a person is carrying skis on their back, as they are either going skiing or returning from a skiing trip", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 492057, "caption": "The image shows a man taking a selfie in a public bathroom, with him standing in front of the mirror", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 388215, "caption": "The image depicts a man standing on a tennis court, getting ready to play a game of tennis", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 111409, "caption": "The image features a man riding a motorcycle, wearing a helmet, and carrying a backpack", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 451391, "caption": "There is a person holding a large bouquet of green broccoli at a grocery store, showcasing their artistic arranging skills", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["broccoli", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 92462, "caption": " The image features a herd of cows moving along a red dirt road, accompanied by two cars on either side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "car", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 397268, "caption": " In the image, there is a shop or store with two bicycles displayed in the window", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "chair", "bench", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 127659, "caption": " The scene depicts a train traveling along a railroad track, with people waiting for it at a train station", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 251857, "caption": "In the image, there are two people skateboarding on a cement surface", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 243212, "caption": "According to the picture, a small child is standing on a grass-filled field while holding a blue Frisbee in each hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "car", "truck", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 444304, "caption": "According to the image, there is a young man squatting on his bed, possibly playing a video game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "remote", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 305000, "caption": " The image shows an outdoor market with a woman standing in front of a fruit stand and two other people nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "In the image, two men wearing tuxedos are sitting at a table while a party is going on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tie", "bottle", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 154846, "caption": "This image captures a delicious pepperoni pizza with mushrooms on it sitting on a counter", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 567254, "caption": "According to the picture, there is a young child standing in front of a television, with blonde hair, seemingly watching something on the screen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "tv", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 79261, "caption": " According to the picture, there is a man standing in the middle of a shallow water feature with a broom, sweeping the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301402, "caption": " The image shows a man sitting in a chair, possibly in a living room or dining room, with a laptop placed on his lap", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "chair", "bottle", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 415828, "caption": " There is a large group of people standing on a city street next to an alley, possibly waiting for a bus or train", "mscoco_hallucinated_words": [["train", "train"]], "mscoco_gt_words": ["backpack", "stop sign", "umbrella", "handbag", "traffic light", "car", "person"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.14285714285714285}}, {"image_id": 543231, "caption": " The scene depicts a woman in her living room, taking a picture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "bowl", "bed", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 495357, "caption": "In the image, a small motorcycle or toy car is being ridden by a small child", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["handbag", "motorcycle", "dog", "person"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 523175, "caption": " The image features a plate with a bowl of soup, filled with various vegetables such as carrots", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bowl", "carrot", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 184945, "caption": "The image features several motorcycles parked along a street next to a train station", "mscoco_hallucinated_words": [["train", "train"]], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 49942, "caption": "The image portrays a man, likely the focal point of the photograph, holding a single open umbrella, while wearing a tie", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 223019, "caption": "There is a blue train stationed at a platform in a city or train station setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "train", "handbag", "car", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 42889, "caption": " In the image, a white teddy bear is sitting on top of a keyboard and keyboard cover", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "bear", "keyboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 22112, "caption": "The image showcases a collection of figurines and a pot with grass inside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 247587, "caption": "According to the picture, there is a man standing on a surfboard in the middle of the beach scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": "In this scene, there is a large bus driving down a city street, with a car on the left side of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 545056, "caption": "The image depicts a large field full of black cows and a few scattered sheep, all in various positions within the field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "dog", "car", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 401411, "caption": "In the image, there is a man standing in front of a table full of food, likely in a restaurant or kitchen setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "book", "person", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 2867, "caption": " In the snow-covered scene, a group of skiers is gathered, with people standing close to each other, and some are skiing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 246963, "caption": "According to the picture, a group of motorcyclists are driving on a downward slope of a road, travelling south", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 498225, "caption": " In the image, a group of people, including a man and three women, are standing in front of a store window displaying numerous cakes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "donut", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124601, "caption": "The image depicts a small, compact kitchen filled with various items, including a laptop and other electronic devices, ovens, and other cooking appliances", "mscoco_hallucinated_words": [["oven", "oven"]], "mscoco_gt_words": ["dining table", "bottle", "keyboard", "sink", "wine glass", "microwave", "laptop", "cup"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.125}}, {"image_id": 581749, "caption": " The image displays a variety of fruits and vegetables placed inside a container", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["orange", "broccoli", "dining table"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 227960, "caption": "In the image, a bowl of food sits on a table filled with a variety of vegetables, including carrots and broccoli", "mscoco_hallucinated_words": [["table", "dining table"], ["broccoli", "broccoli"]], "mscoco_gt_words": ["bowl", "spoon", "wine glass", "carrot", "cup"], "hallucination_idxs": [11, 22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.4}}, {"image_id": 286503, "caption": "The scene takes place in a large enclosure, with a couple of people standing in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 315740, "caption": "This image depicts a spacious and modern kitchen, featuring wood cabinets and stainless steel appliances", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "potted plant", "oven", "chair", "couch", "sink", "tv", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 142108, "caption": "The image depicts a group of people in a kitchen, blindfolded while they are in line, ready to eat a banana", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 542933, "caption": "The image is a photograph taken at a baseball game, where a batter is getting ready to hit the ball and an umpire is standing nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "chair", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 475043, "caption": "A group of three people is sitting on couches in a room, using laptops to communicate and socialize with one another", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "spoon", "couch", "bottle", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 456784, "caption": "The image depicts a person cutting a white, chocolate-iced cake using a knife", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 33753, "caption": " The image depicts a wooden outdoor bench with a remote control sitting on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "remote", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 448694, "caption": " In the image, a group of young men is playing a friendly game of frisbee while a crowd of onlookers watches the action", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": "The image features a bowl filled with a variety of ingredients, including noodles and vegetables", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "broccoli", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 503210, "caption": " The image depicts a living room filled with various furniture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "chair", "couch", "clock", "book", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 142257, "caption": " This scene captures a busy intersection filled with traffic, with several cars, a truck, and a taxi in the middle of the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}], "overall_metrics": {"CHAIRs": 0.09619238476953908, "CHAIRi": 0.06430155210643015, "Recall": 0.34506398537477145, "num_hallucinated_caps": 48.0, "num_caps": 499.0, "hallucinated_word_count": 58.0, "coco_word_count": 902.0, "length_response": 19.470941883767534, "hallucinated_caps_ls": [144305, 324008, 493862, 155671, 32625, 18688, 370657, 481596, 209347, 344942, 490491, 482432, 557998, 59710, 265628, 453731, 259345, 378831, 295105, 526414, 505213, 191691, 561967, 198163, 217593, 558784, 9628, 275749, 372220, 536154, 353320, 531327, 444913, 205193, 163728, 277051, 352900, 227438, 474499, 239445, 105782, 111409, 415828, 495357, 184945, 124601, 581749, 227960]}}}