{"overall_metrics": {"CHAIRs": 0.258, "CHAIRi": 0.09568382735309412, "Recall": 0.5225512528473805, "num_hallucinated_caps": 129.0, "num_caps": 500.0, "hallucinated_word_count": 184.0, "coco_word_count": 1923.0, "length_response": 41.85, "hallucinated_caps_ls": [95908, 324008, 247179, 493862, 253630, 161227, 343534, 459141, 227031, 209347, 183766, 344942, 133146, 498747, 185327, 129707, 37907, 235595, 489909, 333712, 148977, 399058, 183571, 325836, 467887, 346716, 401010, 313928, 222782, 122602, 59710, 527497, 265628, 499594, 255483, 258209, 245664, 453731, 443299, 120776, 219546, 437720, 535403, 449798, 375769, 426172, 138078, 180764, 147762, 333998, 295105, 301837, 240681, 250540, 47940, 134768, 526414, 273132, 505213, 412407, 188136, 449675, 191691, 557447, 134223, 475813, 558784, 53431, 441840, 381031, 539555, 279521, 330050, 254161, 163518, 423984, 288729, 302789, 30667, 328110, 379443, 536154, 353320, 416384, 531327, 1268, 575406, 436814, 275611, 444913, 303099, 205193, 272566, 14940, 191301, 124236, 14285, 381615, 49005, 425569, 210372, 429598, 490711, 304984, 153607, 227438, 18150, 491000, 474499, 358086, 487990, 397268, 127659, 444304, 305000, 567254, 79261, 543231, 184945, 42889, 247587, 124601, 581749, 227960, 315740, 475043, 456784, 33753, 503210]}, "results": {"sentences": [{"image_id": 144305, "caption": "A laptop computer is sitting on a desk with a keyboard and headphones next to it. There are several wires connecting the computer to various devices.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "keyboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 164091, "caption": "In the image, there is a girl sitting in a baby carriage, with a stuffed animal and a toy next to her. The baby carriage is placed in a bedroom, with a dresser and a bed in the background. The girl is smiling, creating a warm and cozy atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "teddy bear", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 308003, "caption": "A wooden bench sits in a grassy area, surrounded by trees and a dirt path. The bench has a green and wooden appearance, with some wood chips scattered on the ground. The setting provides a tranquil and natural atmosphere, creating a comfortable space for relaxation and contemplation.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "chair", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": "The image features a delicious meal consisting of a chicken sandwich, a slice of tomato, and a salad on a plate.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 95908, "caption": "A small white cup with a coffee stain sits on a table next to a mouse and a keyboard. The mouse is connected to a computer, and a laptop is also present on the table. The scene suggests that the person is working on a computer while drinking a cup of coffee.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["laptop", "mouse", "keyboard", "dining table", "cup"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.09090909090909091, "Recall": 1.0}}, {"image_id": 329614, "caption": "A city street is filled with cars, buses, and pedestrians, while a large building stands out in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 324008, "caption": "A person is sitting in a plane seat, enjoying a meal consisting of a sandwich, fruit, and a drink. The meal is served on a tray, which is placed on their lap.", "mscoco_hallucinated_words": [["seat", "chair"], ["sandwich", "sandwich"]], "mscoco_gt_words": ["banana", "person", "dining table", "train", "cup", "airplane", "orange"], "hallucination_idxs": [7, 15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2857142857142857}}, {"image_id": 52700, "caption": "A group of people is enjoying a cake-making event at a table. There are many delicious-looking cakes and desserts on the table, and some people are using forks to taste the food. One person is wearing a white apron, possibly indicating that they are the host or", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "cake", "dining table", "spoon", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 501311, "caption": "A baseball player is pitching a baseball in a dirt field, with a person standing behind him to catch the ball. The player is wearing a baseball uniform, and the image is taken from a close-up perspective. The background of the image is the dirt field, which is a common location for baseball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 247179, "caption": "A group of people dressed in traditional clothing, including a man holding a tusked elephant, are standing in front of a decorated elephant, with the city in the background. The scene is lit up by streetlights and a lighted elephant, adding a festive and color", "mscoco_hallucinated_words": [["streetlight", "traffic light"]], "mscoco_gt_words": ["person", "elephant", "truck", "clock"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 577912, "caption": "A large bathroom with a freestanding bathtub and a separate shower area is shown in the image. The bathtub is surrounded by marble tiles, giving it a luxurious appearance. A sink and a toilet are also present in the bathroom. The bathroom has", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toothbrush", "toilet", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 196341, "caption": "A person walks past a large clock in a busy, dimly lit hallway. The clock features a large face with Roman numerals and is situated on a wall. The presence of the clock creates a sense of time and movement in the image, while the person adds a sense of scale and human interaction to the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "clock"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 234433, "caption": "A sign is posted on a pole at the side of a road, pointing out the left turn lane. The image shows a bicycle parked near the sign, and there is a person walking by.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "bicycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 455610, "caption": "A group of people are gathered around a motorcycle, admiring its unique design and vibrant colors. The motorcycle has a large front wheel and a red and green paint scheme. It appears to be parked on the side of a street or a parking lot, surrounded by people who are curious about the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "motorcycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": "A dining table is filled with a variety of food items, including pancakes, eggs, and a spoon.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "bowl", "cup", "spoon", "cake", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 493862, "caption": "A young man is seen standing on a hill, with his tennis racket in hand, ready to hit a tennis ball. The image captures the sun-drenched landscape, creating a serene and picturesque setting. The young man's outdoor tennis practice is a perfect example of enjoying the out", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "tennis racket", "dog"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 269873, "caption": "A group of people is walking down a city street in front of a bus stop, looking at a sign that reads \"Avenue.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 524656, "caption": "A kitchen filled with various appliances and cookware, including a stove, refrigerator, sink, and microwave, is shown in the image.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["toaster", "microwave", "sink", "bottle", "bowl", "knife", "cup", "spoon", "wine glass", "oven", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.36363636363636365}}, {"image_id": 369547, "caption": "A black and white dog is sitting on the beach, looking out at the ocean while a seagull is flying overhead.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "cat", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 181446, "caption": "The image shows a man standing next to a refrigerator, holding a bottle of soda, and looking at the contents in the refrigerator.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sink", "bottle", "bowl", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 128119, "caption": "A group of people is standing on the sidewalk, waiting for a bus. One person is holding a bicycle, while another person is holding a purple backpack. There are also bicycles hanging on the bus rack, indicating that the bus is likely a public transportation option for those who", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bicycle", "cell phone", "person", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 401027, "caption": "A sandwich is sitting on a white plate in a dark room, with a cup of soup nearby. It's a cold and dark setting, possibly indoors, with the light source coming from the lamp.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "sandwich", "dining table", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 253630, "caption": "A large dining table is sitting in a room with a television, a couch, and a rug. The room has a nice, comfortable atmosphere, making it a suitable place for gathering or spending time with family and friends.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["potted plant", "chair", "dining table", "tv"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 326021, "caption": "A woman is sitting at a table with a teddy bear and a sign that reads \"Badger Day - Come and Get Your Free Eye Exam\" and \"Just See the Results.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "teddy bear", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": "A man rides a bicycle on a yellow line down a street, while another man is walking past a street crossing with a bicycle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": "A man rides a surfboard in the water, performing tricks and jumps.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 161227, "caption": "The image shows a black leather chair with a remote control on a coffee table. The chair is empty, and there is a TV set with a remote control in front of it. The scene is a living room setting where someone might be relaxing and watching TV.", "mscoco_hallucinated_words": [["table", "dining table"], ["tv", "tv"], ["tv", "tv"]], "mscoco_gt_words": ["laptop", "chair", "cell phone", "keyboard", "remote", "couch"], "hallucination_idxs": [14, 25, 50], "metrics": {"CHAIRs": 1, "CHAIRi": 0.42857142857142855, "Recall": 0.3333333333333333}}, {"image_id": 25812, "caption": "A young man is seen skiing down a snowy slope in a forest, with a mountainous backdrop and a ski lift in the distance.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267537, "caption": "A group of three women are sitting together on a bench in a stadium, with umbrellas above them. They appear to be enjoying a rainy day, watching a sporting event or waiting for the start of a game. The image captures the essence of the shared experience and the bond", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "bench", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 195645, "caption": "A group of people, including children and adults, are gathered together at a picnic table, enjoying a glass of wine and socializing. They are in a scenic outdoor setting, surrounded by trees and a mountain in the background. The atmosphere appears to be relaxed and friendly, with the group enjo", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "dining table", "wine glass", "handbag", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 155671, "caption": "A street with a red traffic light is visible in the image, along with a few cars and a large, white building in the background. The street is quite busy, with multiple cars passing through the intersection.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 412894, "caption": "A group of people is walking down a street in London, passing by a red double-decker bus and a streetlight. The scene is bustling and full of activity, showcasing the city's vibrant atmosphere and the diverse crowd of pedestrians.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "backpack", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 32625, "caption": "A glass of cola, a bowl of soup, and a fork sit on a table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "bowl", "cup", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 18688, "caption": "A baseball player is standing on the field, wearing a baseball uniform and holding a baseball bat. He is positioned at home plate, ready to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 343534, "caption": "A young girl is sitting on a chair, holding a stuffed teddy bear, while a stuffed dog is sitting next to her. The girl is wearing a pink and black outfit and a hat, and the dog is wearing a red collar. The scene is set in a living room,", "mscoco_hallucinated_words": [["girl", "person"], ["girl", "person"]], "mscoco_gt_words": ["chair", "potted plant", "teddy bear", "book", "dog"], "hallucination_idxs": [2, 26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6}}, {"image_id": 370657, "caption": "A group of people, including a man, a woman, and a child, ride their motorcycles on the street, with the man and the child wearing helmets. The woman is wearing a helmet as well, but her head is not visible due to the angle of the image. They are", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "A man is sitting in the stands at a baseball game, eating a hot dog while enjoying the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460347, "caption": "A caption for the image could be: A city street is filled with cars and a bus, while a person stands on the sidewalk, looking down.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 398753, "caption": "A group of people, possibly family members, is gathered in the stands, watching a baseball game in progress. They are all seated together and enjoying the event.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 67833, "caption": "A caption for the image could be: \"A group of friends are enjoying a meal together, sitting around a table with a delicious pizza in the center. They are using knives and forks to cut the pizza into slices, and the meal is accompanied by a wine glass and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "dining table", "bottle", "bowl", "pizza", "knife", "cup", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5555555555555556}}, {"image_id": 272880, "caption": "The image shows a person holding a pizza slice and a fork, with a pizza box in front of them on a dining table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "dining table", "pizza", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 254368, "caption": "A man is sitting on a bed, wearing a bathrobe, and holding a plate of food in his hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "pizza", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 193108, "caption": "A young man is standing in a baseball field, wearing a black and yellow baseball jersey and holding a baseball bat. He is in a stance, ready to swing at a ball being pitched by another player. The image captures the excitement and anticipation of a game, where players are preparing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 459141, "caption": "A woman is riding a bicycle, holding a green umbrella, and carrying a large bag on the back of her bike.", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["potted plant", "person", "bicycle", "motorcycle"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 231534, "caption": "An airplane sits on the tarmac, surrounded by luggage carts and cargo trucks.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "suitcase", "truck", "airplane", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 227031, "caption": "A man and woman are standing in front of a cake, smiling and holding a pair of scissors as they prepare to cut the cake. The cake is decorated with flowers, and there is a candle on top.", "mscoco_hallucinated_words": [["scissors", "scissors"]], "mscoco_gt_words": ["person", "dining table", "knife", "tie", "potted plant", "cake"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 209347, "caption": "A woman is sitting on a train, using her cell phone while wearing a leather jacket and a purse. She is seated in a train car with a window view.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["cell phone", "person", "train", "tie", "handbag"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.8}}, {"image_id": 523292, "caption": "A cat is sitting on a computer desk, looking at a laptop screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "cat", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 12375, "caption": "A plate full of delicious food, including a pork chop, potatoes, carrots, and broccoli, is being served on a white tablecloth.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 13550, "caption": "A woman is sitting on a rock, feeding an elephant in a zoo. She is smiling and appears to be enjoying the interaction.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "elephant", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 146837, "caption": "A young man is seen jumping off a skateboard ramp in a park, performing a trick. He is wearing a blue t-shirt and a red and white striped hat. The park is surrounded by trees and a sidewalk, creating a unique environment for skateboarding.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skateboard", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 67042, "caption": "A man is standing near a doorway, looking at his phone while waiting for someone or something. He is dressed in a suit and tie, and appears to be in a business setting. The man is in a position where he can see the doorway, which is likely a common area for people to gather or pass", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 209925, "caption": "A baseball player stands on a baseball field, preparing to pitch a ball. The player is wearing a baseball uniform and has a baseball glove on their left hand. The field is empty, and the player is positioned in the middle of the field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 2154, "caption": "A shopping cart is sitting on a bench in a city street, surrounded by trash and a green umbrella.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "bench", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 274931, "caption": "A black and white image shows a city street with cars parked along the sidewalk, a street lamp, and a building in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 104326, "caption": "A large, spacious kitchen with an island, a dining table, and a green color scheme. The kitchen has a large window, allowing natural light to flood in. There are several chairs and a table, making it suitable for dining or gathering with friends and family.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "clock", "sink", "dining table", "knife", "potted plant", "oven", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 233888, "caption": "A young boy is practicing his pitching skills while standing in front of a television set. He is wearing a baseball cap and a baseball glove, and he has a baseball in his hand. He is aiming to throw the baseball into the television, which is displaying a baseball game on its screen. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "potted plant", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 213905, "caption": "Two women, one wearing a white tennis outfit and the other wearing a black tennis outfit, are standing on a tennis court. They are both holding tennis rackets and smiling, indicating that they are enjoying playing tennis. The image captures their enthusiastic moment during the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "tennis racket", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 277479, "caption": "A young girl is reaching into a refrigerator to grab a bottle of ketchup. She is standing in front of the open door and looking inside. Her mother is also in the kitchen, possibly supervising her.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "refrigerator", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 300784, "caption": "A group of children are sitting in a room with a dog, while they hold a large paper tube and a pencil. They are likely engaged in an art or creative project.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "couch", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 183766, "caption": "A beautifully decorated plate of cheesecake sits on a white dining table, surrounded by a decorative vase and three silver spoons. The plate is adorned with fresh berries, which add a touch of color and elegance to the setting.", "mscoco_hallucinated_words": [["vase", "vase"], ["spoon", "spoon"]], "mscoco_gt_words": ["cake", "fork", "knife", "dining table"], "hallucination_idxs": [17, 21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.25}}, {"image_id": 169169, "caption": "In the image, a city street is lined with tall trees and a beautiful green space, creating a serene atmosphere. A tall, thin flagpole stands in the center of the park, and a green and white banner is displayed on the pole. This banner likely promotes a local event or celebration", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "traffic light", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 409346, "caption": "A group of women are gathered at a table, enjoying a spread of food, including desserts and various types of fruits. One woman is holding a plate, and the other woman is taking a bite from her dessert. They are both smiling and appear to be having a good time.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bowl", "spoon", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 522262, "caption": "In the image, there are several bicycles parked along a sidewalk, with some of them locked to a metal pole. The scene is taken at a city street, and the bicycles are lined up next to each other, making it a convenient and organized parking space for commuters and residents", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "bicycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "A man is holding an orange ball while standing behind a fence, possibly in a park or at a public event.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 344942, "caption": "A small, wooden doll is perched on top of a computer screen, looking down at the user's browsing history on the screen. The doll is placed on a table, and there is a window with a view of the outdoors visible behind it.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["laptop", "clock", "tv"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 275929, "caption": "A pair of toilets sits on a staircase, with a building in the background. The staircase is covered in rust and has a few steps leading up to the building.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toilet", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": "A man and a woman are standing under an umbrella while walking through a park, looking at a building. They seem to be engaged in conversation, and the woman is carrying a purse.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "bench", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 300124, "caption": "A couch with an open door is sitting in front of a brick house, with a microwave on the couch.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "microwave", "chair", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 46919, "caption": "A man is skiing down a snowy slope, wearing a red jacket and carrying a backpack. He is on a trail surrounded by trees, and the snowy terrain creates a picturesque scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 434022, "caption": "A white train engine is seen on a track, with smoke rising from its exhaust. The train is traveling down the tracks, and there are railroad tracks in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 490491, "caption": "A man stands in front of a street sign with a red and white pole, while a street sign with a black background and white letters hangs nearby. The street sign has the name \"Alto\" written on it, and there is a street with a brick wall on the side. The man is likely waiting for", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "stop sign"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 175878, "caption": "A group of friends are gathered together, talking and laughing while using their cell phones outdoors. They are standing near a window and a backpack, with a tree and a building in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "cell phone"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 12669, "caption": "A group of people is gathered at an art gallery, admiring various art pieces. A woman is holding a glass of wine, while the other individuals are discussing the artwork. The scene captures the social aspect of art appreciation, where people come together to share their perspectives and enjoy each other'", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "vase", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 192496, "caption": "A train is parked at a railroad track, with a red-and-white passenger train car in front of it. The train is positioned next to a blue passenger train car. The scene is set on a track with a railroad crossing nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 133146, "caption": "In this image, a living room is filled with a couch, a chair, and a television. The room is well-lit, with a lamp on the coffee table and a window providing natural light. The living room also features a few pieces of artwork on the walls and a rug on the floor. This", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["chair", "vase", "tv", "book", "couch"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 53744, "caption": "A close-up image of a sandwich with tomato slices, lettuce, and a knife, sitting on a white plate, is captured.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375902, "caption": "In the image, a person is shown skiing down a snowy slope while wearing a ski suit, and carrying a pair of skis. The person is in a race, and there are two flags or banners in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498747, "caption": "A man is sitting at a table surrounded by friends, laughing and talking. He is using his cell phone to make a call while holding a beer bottle. The image shows a fun and lively atmosphere, with the man and his friends enjoying each other's company and possibly discussing important matters or", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "bird", "cell phone", "bottle"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.75}}, {"image_id": 52435, "caption": "In the image, a group of people are enjoying a day at the beach, with some on surfboards and others on boards, riding the waves in the ocean.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "bird", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 301977, "caption": "The image features a cow standing by a collection of various drinks and snacks, including bottles of soda, juice, and other beverages, as well as a box of milk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cow", "refrigerator", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 261097, "caption": "A tennis player stands on the court, wearing a black and white striped shirt, white shorts, and a tennis cap. He holds a tennis racket and is looking up at the scoreboard on the court.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "bench", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227204, "caption": "A group of three women, one elderly and two young, are sitting at a dining table, enjoying their meal together. One woman is eating a banana, while the other two women are eating food from their bowls. They are all smiling and engaged in conversation. The image capt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "cell phone", "person", "dining table", "bottle", "bowl", "knife", "cup", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 353981, "caption": "A large, silver airplane is parked on a runway, with a smaller aircraft nearby. The airplane has a long, curved wing, and the smaller aircraft appears to be a military jet.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "airplane"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 185327, "caption": "In the image, a group of people, including a man, woman, and child, are walking along a street in a city. They are surrounded by a group of elephants, which are walking behind them. The man is holding a camera to capture the scene. This unusual and unexpected sight is likely causing a", "mscoco_hallucinated_words": [["elephant", "elephant"]], "mscoco_gt_words": ["bus", "person", "cow", "car", "horse"], "hallucination_idxs": [34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.2}}, {"image_id": 348654, "caption": "A smartphone is placed on a table next to a computer, while a speaker is sitting on the table as well.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "cell phone", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 482432, "caption": "A toothbrush is sitting on top of a sink, and a tube of toothpaste is next to it. A toothbrush and toothpaste are essential for maintaining good oral hygiene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toothbrush", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 454161, "caption": "A delicious pizza with various toppings is being enjoyed at a dining table, accompanied by a glass of wine. The toppings include pepperoni, onions, and green peppers. The pizza is served on a white plate, and the wine glass is placed next to it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "fork", "dining table", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 144723, "caption": "A dog is flying through the air while catching a frisbee in a grassy field. The dog is enjoying the thrill of playing with its owner and the frisbee, demonstrating its agility and enthusiasm for the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "car", "dog", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "A hand is holding a cell phone with a small screen, and it is connected to a handheld remote control.", "mscoco_hallucinated_words": [["remote", "remote"]], "mscoco_gt_words": ["person", "book", "cell phone"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 379842, "caption": "A white Nintendo Wii controller is sitting on top of a book with a cover featuring Mario and Luigi, as well as a video game instruction booklet. The controller is next to a small white and black gaming console.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["book", "remote", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 203110, "caption": "A vintage streetcar is stopped on a city street, with a man walking past it. The streetcar is painted with an orange color and has a unique design, giving it an old-fashioned appearance. The scene is set in a busy urban area, with the streetcar sitting on the tracks and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "truck", "train", "car", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 556478, "caption": "A close-up image of two pizzas on a baking sheet, one with a thick crust and a white sauce, and the other with a thin crust and a red sauce, is shown. The pizzas are in the process of being baked in a kitchen, and they are", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "pizza", "cup", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 103815, "caption": "A baseball player is pitching a baseball on a field, while another player is preparing to catch the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 451943, "caption": "A large, spacious bed is shown in the image, with a number of pillows and blankets on it. The bed is positioned in a room with a wooden floor and is surrounded by a bedside table and a lamp. The room has a warm, inviting atmosphere, making it a comfortable place", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["suitcase", "bed", "backpack", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 268854, "caption": "A group of people is gathered around a dock, where they are holding a large wooden crate. The dock is located near a body of water, possibly a lake or a river. The scene is vibrant and colorful, with the people and the wooden crate being surrounded by boats and other watercraft.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 34464, "caption": "A group of people, including a man and a woman, are enjoying the ocean on a sandy beach. They are standing on the shoreline with surfboards, and a man is holding a red surfboard.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 495513, "caption": "A man and a woman are holding a hot dog and a bun at an outdoor event, possibly a barbecue or a campfire. They are smiling and enjoying their food together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 529256, "caption": "A pair of dogs, a brown and white one, and a brown one, are laying on a red bed together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bed", "book", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "A cat sits on a TV stand, watching TV as a video game is playing on a nearby computer screen. The cat is perched on top of a wooden TV stand, its eyes fixed on the screen, enjoying the entertainment.", "mscoco_hallucinated_words": [["computer", "laptop"]], "mscoco_gt_words": ["potted plant", "cat", "tv"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 506401, "caption": "A street scene with a city, a large concrete statue of a wolf, a traffic light, and a busy street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "cat", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 406611, "caption": "A group of people is skiing down a snowy slope in a mountain resort, with snow-covered trees and a ski lift in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "A large, white truck is parked next to a group of vehicles in a parking lot. In the back of the truck, there is a large satellite dish. A man is standing next to the truck, looking at a small screen on the side of the vehicle. There are a few cars", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "tv", "remote"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 278365, "caption": "A couple is enjoying a meal together while sitting on a patio, eating pizza and drinking beer.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person", "dining table", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 69757, "caption": "A group of friends gathered around a table, sharing a birthday cake and enjoying their time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "dining table", "knife", "cup", "wine glass", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 432213, "caption": "A delicious sandwich is sitting on a plate in front of a person at a restaurant, with a glass of wine to the side. The sandwich is made with a fried egg, lettuce, and fries, and it's being enjoyed by the person at the dining table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sandwich", "dining table", "bowl", "knife", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 368367, "caption": "A young woman is smiling while talking on her cell phone, sitting outside a restaurant with a glass of water.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cup", "person", "cell phone"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "A busy intersection with a road construction site is shown in the image, with a road sign pointing towards Grand National Boulevard. There are also vehicles, traffic lights, and construction equipment on the street. The scene suggests that the area is currently undergoing renovation or expansion.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 92131, "caption": "A group of people, including a woman and a man, are standing in front of a bus, waiting for it to arrive. The bus has a sign on it that reads \"Green Line.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": "In the image, a young woman is lying on her back on the floor with her backpack open. She is probably resting or relaxing after a long day, as the backpack is open and she is not actively using it. This scene might suggest that the woman is taking a break and enjoying her", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["suitcase", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565148, "caption": "A baseball player is swinging a bat at a ball, surrounded by a crowd of people. The player is in the middle of a game, possibly during a home run, and the crowd is excitedly cheering and watching the action unfold. The image captures the intensity and excitement of the game, showcasing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 160183, "caption": "A fire truck is parked in front of a building, and there is a fire hose being used in the parking lot.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 555456, "caption": "A group of people are skiing down a snow-covered mountain, enjoying their time on the slopes. One man is particularly focused on his skiing, while others appear to be enjoying the winter sports activity. The image captures the excitement and thrill of skiing down a snow-cover", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 235595, "caption": "A group of motorcycles are parked in a row on a city street, with a large bike in the middle. People are walking around the area, and there are cars and a caf\u00e9 nearby.", "mscoco_hallucinated_words": [["bike", "bicycle"]], "mscoco_gt_words": ["parking meter", "motorcycle", "person", "car", "cup", "potted plant"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 489909, "caption": "A colorful assortment of fruits and vegetables is displayed in a basket or container, showcasing a variety of fresh produce. The image features a mix of brightly colored fruits such as oranges, bananas, and apples, as well as green cucumbers and other vegetables", "mscoco_hallucinated_words": [["apple", "apple"]], "mscoco_gt_words": ["banana", "orange", "bowl"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 501080, "caption": "A brightly colored Christmas cactus sits in a vase, illuminated by the light from the lamp. This beautiful plant is surrounded by pink flowers, adding a touch of festive cheer to the room. The vase serves as a decorative centerpiece, elevating the aesth", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "vase", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 405183, "caption": "A young girl is in a living room with a group of people, playing a video game on a console. She is standing in front of the TV and appears to be holding a controller in her hand. The scene is lively and engaging, with the group of friends gathered around the TV, enjoying their time", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["book", "chair", "person", "tv", "potted plant", "handbag", "remote", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 409138, "caption": "A green city bus is parked at the side of the road in front of a building.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 411840, "caption": "Two tennis players, a man and a woman, walk on a grassy tennis court, each holding tennis rackets. They are walking side by side, looking at each other.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "tennis racket", "chair", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 333712, "caption": "A close-up image of a slice of pizza with bacon toppings and green onions on a yellow plate, with a fork and a knife on the side, is presented. This delicious pizza is ready to be enjoyed, and the presence of a fork and knife indicates that it can be", "mscoco_hallucinated_words": [["fork", "fork"], ["knife", "knife"], ["fork", "fork"], ["knife", "knife"]], "mscoco_gt_words": ["pizza", "spoon", "dining table"], "hallucination_idxs": [21, 24, 46, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 148977, "caption": "A teddy bear is sitting on a table next to a computer with headphones on, listening to music while a book is open on the table.", "mscoco_hallucinated_words": [["computer", "laptop"]], "mscoco_gt_words": ["bottle", "keyboard", "dining table", "bear", "teddy bear", "book"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 399058, "caption": "A man rides a motorcycle alongside a large elephant while driving down a dirt road, with a truck in the background.", "mscoco_hallucinated_words": [["motorcycle", "motorcycle"]], "mscoco_gt_words": ["elephant", "bicycle", "person", "truck", "orange"], "hallucination_idxs": [4], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 183571, "caption": "A man is standing next to a red train car, holding a small dog while riding a boat on a river.", "mscoco_hallucinated_words": [["train", "train"], ["car", "car"]], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [8, 9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 1.0}}, {"image_id": 325836, "caption": "A red and black motorcycle with a colorful engine sits on a red carpet-like surface, attracting the attention of the people around it. The motorcycle has a unique and eye-catching design, with an orange and purple engine, making it a standout among other vehicles. The presence", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["person", "handbag", "bicycle", "motorcycle"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 437910, "caption": "In the image, we see a small bathroom with a sink, toilet, and a shower. There is also a trash can and a newspaper next to the toilet. The bathroom appears to be unfinished or under construction, as there are exposed pipes and a messy appearance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "bottle", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 155885, "caption": "A picturesque scene of a fishing village on the shore, with boats and birds in the water, and a bird in the sky.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bird", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 467887, "caption": "A man sits at a table, using a computer and wearing glasses, while he is on a phone call. He is wearing a red shirt and is sitting in a living room setting.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["laptop", "chair", "mouse", "person", "dining table", "couch"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 174402, "caption": "A man in a blue shirt and white tennis shoes is holding a tennis racket, standing on a tennis court, and looking at a tennis ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 352734, "caption": "A little boy is eating a slice of chocolate cake from a plate, using a spoon to eat the creamy dessert.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "dining table", "spoon", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 346716, "caption": "A group of old red buses is driving down a city street, passing by a large building with a clock on it. The scene is captured in a black and white photograph, giving it a timeless feel.", "mscoco_hallucinated_words": [["clock", "clock"]], "mscoco_gt_words": ["person", "car", "bus"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 451144, "caption": "Two men are standing atop a snowy hill, looking out at the beautiful landscape below. They are wearing hiking gear and appear to be enjoying the scenic view. The snow-covered hill provides a serene and picturesque setting, and the men are likely taking in the beauty of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 295656, "caption": "A group of people, including a man and a woman, are enjoying a meal together in a restaurant. They are eating pizza and drinking beer, and one of the people is wearing a suit. The image shows them laughing and enjoying their time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "clock", "person", "tie", "pizza", "car", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 129886, "caption": "A man and a woman are skiing down a snow-covered slope, both wearing skiing gear. The man is using a snowboard, while the woman is skiing with a pair of skis. The scene takes place on a mountain, with a ski lift in the background, and a large", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 557998, "caption": "A young woman sits at a table in a lush outdoor setting, surrounded by plants and greenery. She is holding a glass of wine, possibly a bottle, and looking at the camera. This image captures a moment of relaxation and enjoyment, as the woman enjoys her drink in a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "dining table", "bottle", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 401010, "caption": "A white bed with pillows is seen in a room, with a desk in the background. The room has a mirror on the wall, and there is a chair or stool near the bed. The image shows a cozy, inviting atmosphere, and it could be used for various purposes, such as a", "mscoco_hallucinated_words": [["desk", "dining table"]], "mscoco_gt_words": ["sink", "chair", "bed", "tv"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 567562, "caption": "A family is having dinner at a table with a white tablecloth, enjoying a variety of foods on their plates. The scene is filled with laughter and joy as the two young girls are engaging in conversation while eating their meals.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "bottle", "bowl", "dining table", "pizza", "broccoli", "cup", "spoon", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.18181818181818182}}, {"image_id": 313928, "caption": "A yellow surfboard is sitting on the beach, next to a blue table with white chairs and a green umbrella. A bottle of wine is on the table, and a yellow beach towel is draped over the chair. This idyllic scene captures the essence of a relax", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["surfboard", "chair", "dining table", "bottle", "wine glass"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.8}}, {"image_id": 490284, "caption": "A black dog is leaning against a person, likely resting its head on the person's shoulder. The image captures a moment of affection and companionship between the dog and its owner.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "couch", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 346940, "caption": "A close-up of a kitchen scene features a pot on a stove, with steam rising from the pot.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "knife", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "A couple walks down a city street past an old gas station with a vintage sign and a car parked outside. The woman is carrying a purse and wearing a hat, while the man is walking next to her. The scene captures the charm and nostalgia of a bygone era", "mscoco_hallucinated_words": [["purse", "handbag"]], "mscoco_gt_words": ["person", "truck", "cell phone", "car"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 255934, "caption": "A mother elephant and her baby are walking together in an enclosure. The mother is carrying her baby on her back, and they are being watched by people in the background. The image captures the loving bond between the mother and her young, showcasing their natural and playful behavior.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cow", "handbag", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 278627, "caption": "A young couple enjoys their dinner at a restaurant, with a smiling man holding a chicken dish and a woman holding a plate of vegetables. They are seated at a wooden table, surrounded by a warm and inviting atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "dining table", "bottle", "cup", "spoon", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 400851, "caption": "A group of people is gathered on a beach, enjoying the sunny day and spending time together. They are sitting on benches and chairs, and some people are even lounging on a beach mat. This image captures the essence of a relaxing and leisurely day at", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "chair", "person", "backpack", "umbrella", "bench", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 472610, "caption": "The woman is standing in a field surrounded by cows and a dog, with the dog sitting on the ground and looking up at her. The image captures the woman's interaction with the animals, creating a serene and peaceful atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cow", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 78565, "caption": "A group of people, including a man and a woman, are gathered near a body of water, possibly a lake or the ocean, watching a sailboat race. The scene is quite picturesque, capturing the excitement and fun of the sport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": "A group of people is hanging out on a street corner, enjoying a skateboarding session.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skateboard", "chair", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 289640, "caption": "A group of friends are sitting around a table, with a man in the center holding a yellow frisbee. They are having a fun time together, enjoying the outdoors and engaging in a game of frisbee toss.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "dining table", "cup", "wine glass", "orange", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 122602, "caption": "A woman is sitting at a table with a paper and scissors, surrounded by various art supplies, including glue, markers, and a pencil. She is likely working on a craft project or artwork, using the paper and scissors to create intricate designs or patterns. The presence of the", "mscoco_hallucinated_words": [["woman", "person"]], "mscoco_gt_words": ["dining table", "bottle", "scissors"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 24104, "caption": "The image shows a cluttered workspace with a computer, a monitor, and a keyboard on a desk. A laptop is placed on top of the monitor, and there is a cup of coffee on the desk as well.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "keyboard", "dining table", "bed", "cup", "tv", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.625}}, {"image_id": 183709, "caption": "A group of people, including a man and a woman, are standing on a city street, looking at a crosswalk. They are likely waiting for the traffic light to turn green before crossing the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 59710, "caption": "A black refrigerator with a shelf inside is sitting on a wooden floor. It has a door open and is filled with an ice maker, a bottle, and a bag of ice.", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["refrigerator", "chair", "dining table"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": "A young boy is standing in a baseball field, holding a baseball glove and wearing a green and yellow baseball shirt. He is surrounded by other kids and adults, possibly waiting for their turn to play or watching the game. The image captures the boy's enthusiasm and excitement as he", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "bottle", "bench", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 314729, "caption": "A black and white photograph shows a man standing in a baseball uniform, holding a baseball bat. The image is from an old-time baseball card, which captures the essence of the sport and its players from the past.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 527497, "caption": "A computer workspace is seen in the image, featuring a computer monitor, keyboard, and mouse. There is also a phone sitting on the desk, and a large display screen with various screenshots on it. The room is spacious, and the workspace is well-organized, indicating a professional", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["laptop", "mouse", "keyboard", "dining table", "tv"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 1.0}}, {"image_id": 411564, "caption": "A young man is sitting on a chair next to a window in a kitchen, enjoying his phone. The image is taken at a low angle, which emphasizes the man's height and perspective, making it seem as though he is looking down at the scene below.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person", "dining table", "bottle", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 320350, "caption": "A man and woman are walking on a frozen lake with their dogs, enjoying a winter activity together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 401857, "caption": "A baseball player is attempting to hit the ball during a game at a stadium. He is swinging his bat, and the ball is in mid-air. The crowd is watching the action on the field, and the player is likely trying to score a run or hit a home run.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "cup", "bench", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 285302, "caption": "A young boy is sitting at a dining table, surrounded by various materials, such as scissors, paper, and a pencil. He is likely working on a craft project or art piece.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "dining table", "scissors"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 61959, "caption": "A city bus is driving down the street, passing by a restaurant and a traffic light. The bus is red and white, and it is moving through the intersection, possibly stopping at the traffic light.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "traffic light", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 229659, "caption": "A group of friends are gathered at a table in a restaurant, using their laptops and a large screen to access the internet. They are seated in a cozy atmosphere, enjoying their time together while using their devices to browse the internet.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "clock", "person", "bottle", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 473118, "caption": "A man skateboarding on a ramp, with a skateboard and a pair of blue jeans, is shown in the image. He is performing a trick or trickery on the skateboard, possibly jumping or riding the board in the air. The image captures a moment of the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "Two women, one wearing a purple jacket and the other wearing a blue jacket, are standing next to a sign in the snowy woods. The sign provides information about the area, which appears to be a hiking trail. The women are likely out for a winter hike, enjoying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 416104, "caption": "A group of friends sit at a table outside a restaurant, enjoying their drinks and conversation. The outdoor setting provides a pleasant and relaxing atmosphere, and the umbrella overhead adds a touch of protection from the sun or rain.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "umbrella", "dining table", "bottle", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 511852, "caption": "Two men are skiing down a snow-covered slope, one with a backpack on, and the other is carrying a backpack. They are enjoying the winter sport, and their presence on the mountain suggests that they may be participating in a skiing competition or engaging in a leisurely", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 59386, "caption": "In this image, there are several giraffes gathered together, with one giraffe reaching up to eat a leaf from a tree. This moment showcases the unique and fascinating behavior of these tall creatures as they interact with each other in their natural habitat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "zebra", "giraffe"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "A green pedestrian crossing signal is illuminated in the middle of a city street, signaling that pedestrians have the right of way.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 153692, "caption": "A man rides a bicycle down a street, with a dog sitting on the back of the bike. The man is wearing a backpack and appears to be traveling on a city street. The image is captured during a sunny day, with a red traffic light visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "car", "traffic light", "backpack", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 265628, "caption": "A man is sitting on a toilet inside a small, enclosed bathroom. The toilet is located in a wooden stall, and there is a sink nearby. The man is wearing dress shoes and appears to be in a professional setting, as there is a suitcase in the image.", "mscoco_hallucinated_words": [["sink", "sink"], ["suitcase", "suitcase"]], "mscoco_gt_words": ["person", "toilet", "bowl"], "hallucination_idxs": [27, 49], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 499594, "caption": "A plate of broccoli and chicken is placed on a table in front of a blue background, with a fork and knife next to it. The broccoli is arranged on top of the chicken, and there is a green salad bowl on the table as well. The dish is served", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "bottle", "broccoli", "knife", "cup"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 5934, "caption": "A baseball glove, with a baseball sitting inside, is on a bench. The glove is made of leather, and it has a checkered pattern on the fingers. The baseball is made of leather and is in the process of being thrown.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47828, "caption": "A boat floats on the water, illuminated by blue lights, while a city bridge stands behind it. The image captures the nighttime ambiance of the city, with the boat and the bridge reflecting off the water, creating a stunning and serene scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47916, "caption": "A group of dogs is playing in the grass, with one dog holding a red frisbee in its mouth. The dogs are running around and having fun, engaging in a game of catch.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "car", "bench", "dog", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 255483, "caption": "A man is sitting at a desk, surrounded by piles of papers, and he is writing with a pen. There is also a cup of coffee nearby. The image is a representation of a busy work environment where the man is engaged in his tasks, possibly working on a story or preparing to write an article", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["person", "book", "dining table", "scissors"], "hallucination_idxs": [26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 131138, "caption": "A man is sitting at a desk with a computer, a television, and a coffee cup. There is a laptop on the desk as well. The man is using the computer and watching television simultaneously, while also enjoying his coffee. This scene suggests that the man is multitasking and likely spending", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "person", "keyboard", "dining table", "cup", "spoon", "tv", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5555555555555556}}, {"image_id": 258209, "caption": "A man sitting on a bench in front of a brick wall, looking at his phone.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "book", "bench", "bicycle"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 347453, "caption": "A busy street scene with multiple red double-decker buses, cars, and people walking. The street is lined with tall buildings and streetlights, and a pedestrian crossing is present. The image captures a bustling city scene with various modes of transportation and people going about their day", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "car", "traffic light", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 285820, "caption": "In the image, a living room is shown with a couch, a television, and a dining table. The couch has a black and white striped cushion, and there are two brown pillows on it. The television is positioned on the wall above the couch, and there is a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "bowl", "tv", "book", "bench", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 245664, "caption": "A man sits at a desk in front of a computer, laptop, and a TV. He is holding a glass of wine and has a laptop open in front of him. There is a notebook and a pen on the desk as well. The image shows a cluttered workspace with a mix", "mscoco_hallucinated_words": [["man", "person"]], "mscoco_gt_words": ["laptop", "mouse", "keyboard", "dining table", "cup", "wine glass", "tv", "book"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.375}}, {"image_id": 453731, "caption": "A dog is lying on the floor near a table with a bottle and a wooden barrel. The dog is likely enjoying the sunny day and the warmth on the floor.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["dog", "cup", "bottle"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 524601, "caption": "A group of friends are gathered around a couch playing video games. They are all holding controllers and participating in the game together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "book", "remote", "couch", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 253262, "caption": "A large plane is parked on the tarmac at an airport, surrounded by people. Some of them are walking around the aircraft, while others are standing next to a truck. There is also a person standing in front of the plane, looking at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "suitcase", "truck", "tie", "airplane"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 87052, "caption": "A couple is sitting in a kitchen, possibly preparing or enjoying a meal together. The man is leaning against a counter, and the woman is standing next to him. They appear to be engaging in conversation or preparing food, as they are both holding utensils. The scene is captured in", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "bowl", "vase", "cup", "oven", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 357578, "caption": "A red fire engine is parked on a city street, next to a car and a pedestrian.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 418692, "caption": "A young woman sits on a couch in a living room, reading a book while her boyfriend is laying on the couch next to her. They are both surrounded by colorful pillows and a couple of lamps. The room has a warm and cozy atmosphere, with a large window that allows", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person", "book", "remote", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 259345, "caption": "A man with a beard and a rain umbrella is sitting on a chair, smiling at the camera. He is wearing a colorful and patterned outfit, which could be a traditional costume or a vibrant shirt. The image captures a lively and playful atmosphere,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 119709, "caption": "A woman is kneeling on a kitchen table, surrounded by a large number of donuts, using a small cutting tool to cut each donut into a hole.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "dining table", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 443299, "caption": "A couple is sitting on a bench at a train station, looking at their cell phones. The woman is wearing a black coat, and the man is wearing a red jacket. They are both using their phones to text or scroll, and they appear to be engaged in conversation. The image capt", "mscoco_hallucinated_words": [["train", "train"]], "mscoco_gt_words": ["cell phone", "person", "backpack", "handbag", "bench"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6}}, {"image_id": 120776, "caption": "A group of people are gathered around a large metal sculpture in a city square. The sculpture appears to be a man or a person with a large head, which is a common art form in public spaces. People are sitting on chairs, enjoying their time and the artwork, while others are standing nearby", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["person", "umbrella", "tie"], "hallucination_idxs": [45], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3333333333333333}}, {"image_id": 411765, "caption": "A man is standing in a tennis court, holding a tennis racket and about to hit a tennis ball. He is dressed in white tennis attire and is concentrating on his upcoming swing.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 447991, "caption": "In the image, a group of people, including a girl in shorts, are walking down a sidewalk in the city at night. The city is bustling with people, cars, and streetlights, creating a lively atmosphere. The girl is holding a blue toy car and a yellow toy", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "cell phone", "person", "truck", "traffic light", "car", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 276719, "caption": "A small dog is walking on the sidewalk next to a group of people, including a man, a woman, and a young girl, who are gathered near a car. The dog is brown and white in color, and it is wearing a collar.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "motorcycle", "person", "truck", "car", "handbag", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 422328, "caption": "A horse-drawn wagon is parked outside a building, likely a restaurant or a bar, in the snowy environment. The wagon is filled with hay, and there is a man standing next to it, possibly unloading it. The scene captures the winter atmosphere and the importance of hay for animals", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "horse", "snowboard", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 354559, "caption": "A woman is holding a teddy bear and smiling for the camera while wearing a black dress.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "teddy bear", "bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 438788, "caption": "A group of people are gathered around a large slice of cake, which is on a white plate. The cake is covered in chocolate and is decorated with a birthday candle. The people are enjoying the cake and celebrating a special occasion, as evidenced by the presence of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cake", "knife", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 468005, "caption": "A large elephant stands on a wooden platform, near a staircase. It appears to be enjoying its time at the beach, with the people nearby looking at the elephant with a mix of curiosity and excitement.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "elephant", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 545594, "caption": "A man is standing in the middle of a crowded bus, holding a backpack and looking out the window.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "chair", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 219546, "caption": "A large dining table is filled with various dishes, including a ham, a salad, and a bowl of appetizers. The table is set with plates, cups, and a knife, and there are a few utensils on the table. The scene appears to be a gather", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["fork", "chair", "bottle", "dining table", "bowl", "knife", "spoon"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.42857142857142855}}, {"image_id": 386645, "caption": "A city street is crowded with cars and a truck, while a pedestrian walks down the sidewalk. A large, run-down building with a sign reading \"Tavern\" stands nearby, and a person rides a motorcycle on the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "truck", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 155131, "caption": "A young woman in a white tennis outfit is playing a tennis match on a green tennis court. She is wearing a tennis hat and holding a tennis racket, and is in the process of serving the ball. The woman is standing at the baseline, ready to hit the ball back. The tennis match is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "tennis racket", "person", "tie", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 188752, "caption": "A man is standing in front of a fruit stand at a market, looking at a bunch of bananas hanging from a rope. The man is likely a vendor, inspecting the quality of the bananas before deciding how to price them or prepare them for sale. The image captures the interaction between the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "banana", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 228350, "caption": "A group of people are sitting at a long dining table in an outdoor setting, enjoying a meal together. They are seated under a canopy of umbrellas and chairs, providing shade and protection from the sun. The atmosphere is casual and relaxed, with people conversing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "umbrella", "dining table", "bowl", "tie", "cup", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437720, "caption": "A young woman is sitting at a desk, typing on a laptop. She is also wearing a red dress and has a book open in front of her. The woman is in a room with a red floor and a red chair, which adds a pop of color to the space. The image captures a moment", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["laptop", "chair", "person", "dining table", "vase"], "hallucination_idxs": [24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.8}}, {"image_id": 378831, "caption": "A woman is walking down the sidewalk carrying a large red bag, passing by a fire hydrant near a street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "fire hydrant", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375503, "caption": "A man sits at a desk in a room with a large wooden staircase.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "clock", "person", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 330369, "caption": "A fishing boat is parked in the water, with a man standing on the deck, and another man is standing on the pier, looking at the boat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bird", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 288576, "caption": "A man is playing with a red frisbee on a grassy field, with a tree in the background. He is running towards a tree stump and attempting to catch the frisbee in mid-air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 32190, "caption": "A life-like horse figurine stands on the sidewalk in front of a small, old-style building. The horse figurine is made of metal, with a shiny, black finish. It is positioned on a black-colored base, creating a striking visual contrast between the figurine and the surrounding", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "horse", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 535403, "caption": "In the image, a bathroom is captured with a sink, a toilet, and a hair dryer. A woman is standing in front of the sink, brushing her hair with a hair dryer. There is also a hairbrush, a bottle of shampoo, and a to", "mscoco_hallucinated_words": [["woman", "person"]], "mscoco_gt_words": ["clock", "hair drier", "sink", "bottle", "toilet", "potted plant"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 449798, "caption": "The image shows a desk with a computer, a mouse, and a keyboard. The desk has a large monitor and a lamp next to it. There are also a few figurines and a television on the desk.", "mscoco_hallucinated_words": [["monitor", "tv"], ["television", "tv"]], "mscoco_gt_words": ["laptop", "cell phone", "mouse", "keyboard", "dining table", "book"], "hallucination_idxs": [21, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 375769, "caption": "A young boy is sitting at a table outside a restaurant, eating a sandwich and drinking water.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["chair", "bicycle", "person", "umbrella", "hot dog", "dining table", "car", "cup"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 426172, "caption": "A colorful and inviting dining area features a table with a wine bottle on it, a wine glass, and a wine aerator. There are also a few other items on the table, such as a vase, a wine aerator, and a plate. The image is set in a shop,", "mscoco_hallucinated_words": [["wine glass", "wine glass"], ["vase", "vase"]], "mscoco_gt_words": ["chair", "dining table", "bottle", "knife", "book"], "hallucination_idxs": [17, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.4}}, {"image_id": 20650, "caption": "A sandwich with broccoli and a side of fries sits on a plate, ready to be enjoyed. The sandwich is a tasty and healthy option, combining the nutritious vegetable broccoli with a crispy bun and possibly some delicious toppings. The side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "sandwich", "dining table", "bowl", "broccoli", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 138078, "caption": "A young baseball player stands on a field, holding a baseball bat. He is wearing a red and white baseball uniform and gloves, and has a baseball cap on his head. The player is positioned in the middle of the field, ready to swing his bat and hit a ball. The image captures the", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 152499, "caption": "A group of people is gathered around a pool, enjoying the sunny day while a little girl is sitting on the edge of the pool with a red water toy.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "chair", "person", "umbrella", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 180764, "caption": "A man is sitting at a table, eating a donut from a box.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "microwave", "bottle", "donut"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 147762, "caption": "A dessert topped with ice cream and a scoop of chocolate cake sits on a white plate, served with a side of nuts and a small bowl of yogurt.", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["cake", "fork", "dining table"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 113860, "caption": "A boat is traveling down a river, surrounded by trees and water.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 460866, "caption": "A toothbrush and toothpaste are sitting on a bathroom sink, with a toothbrush bristle partially covering a toothpaste tube.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toothbrush", "dining table", "bowl", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177015, "caption": "A man is sitting on a couch, using his laptop and a cat is sitting on his lap.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "person", "cat", "refrigerator", "couch", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 333998, "caption": "A large kitchen with a countertop and a dining table is filled with various objects, including a refrigerator, a stove, and a microwave oven. There is also a sink, a dishwasher, and a trash can in the kitchen. A cup is sitting on", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["microwave", "person", "sink", "suitcase", "bottle", "bowl", "cup", "oven", "refrigerator"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.5555555555555556}}, {"image_id": 47131, "caption": "A group of people are gathered around a train wreck, which has caused significant damage to the train and the surrounding area. The train wreck has resulted in a mess of debris, with parts of the train scattered across the ground. The people are trying to make sense of the situation, assessing the damage", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 425447, "caption": "A man is standing next to a white pickup truck, which has a fire hose attached to it. The truck is parked on a dirt road, and there is a person standing next to it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "fire hydrant", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295105, "caption": "In the image, a man is standing in a kitchen, holding a bottle of soda and looking at a refrigerator. He is surrounded by various kitchen appliances, including a stove, a microwave, and a sink. The man is dressed in a red shirt and blue je", "mscoco_hallucinated_words": [["microwave", "microwave"]], "mscoco_gt_words": ["person", "sink", "bottle", "bowl", "oven", "refrigerator", "apple"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.7142857142857143}}, {"image_id": 443259, "caption": "A well-designed kitchen features a white countertop, wooden cabinets, and a stainless steel appliance. There is a dining table and chairs, a sink, a refrigerator, and an oven. A potted plant adds a touch of greenery to the space. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "sink", "dining table", "bowl", "bottle", "potted plant", "oven", "refrigerator", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 537861, "caption": "A train is traveling down the tracks, passing by a station platform.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 145020, "caption": "A duck is posing in front of a Christmas tree and a Mickey Mouse statue, while a man and a woman are standing nearby. The Mickey Mouse statue is holding a sign with the message \"Merry Christmas\" written on it. The duck and the statue are both dressed in festive attire", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "teddy bear", "bird", "mouse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 249969, "caption": "The image features a plate with a variety of vegetables, including carrots, broccoli, and potatoes, as well as a roasted chicken and a turkey. The dish is served on a white plate with a red background, making it visually appealing. The vegetables are arranged", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "broccoli", "bird", "knife", "spoon", "wine glass", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 146504, "caption": "A young man sits at a desk, using a computer mouse to navigate on the computer screen. He is sitting in a room filled with office supplies, and there is a cup on the desk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "person", "keyboard", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 40037, "caption": "A large clock tower stands tall next to a building in a city, with a clock face visible on its side. The clock tower is likely a prominent landmark in the city, and its presence is a testament to the city's history and architecture. The clock tower may be part of a historic building or a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "clock"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 343218, "caption": "In the image, a young man is playing tennis on a court, holding a tennis racket while serving the ball. He is wearing tennis attire, including a white shirt and blue shorts. The image captures a moment of concentration and focus as the young man prepares to hit the ball back to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 301837, "caption": "A kitchen with a large window and a white refrigerator is showcased in the image. It features a countertop with a stove, sink, and a microwave. The kitchen also has a white cabinet with a glass door and a dining table with a tablecloth. The overall design", "mscoco_hallucinated_words": [["microwave", "microwave"], ["table", "dining table"]], "mscoco_gt_words": ["clock", "sink", "oven", "refrigerator", "apple"], "hallucination_idxs": [28, 44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6}}, {"image_id": 309071, "caption": "A man is seen standing next to a bicycle, which is parked on the side of a road. He is adjusting the bike's handlebars.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "backpack", "potted plant", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 240681, "caption": "A young man is standing next to a red motorcycle parked on a city street, looking at his phone. He is wearing a black backpack and green sneakers, and he has his helmet on.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "car", "backpack", "motorcycle"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 178753, "caption": "A young woman, possibly a student, sits in a red chair at an arena, wearing a black jacket and smiling for the camera. She is holding a cell phone, which could be a sign that she is taking a selfie or making a call.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "cell phone"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 278890, "caption": "A man is holding a cell phone and is taking a picture of a woman who is also holding a cell phone. They are standing near a table in a room, possibly a restaurant or a public space. The man is using the camera on his cell phone to take a picture of the woman, and she is likely sm", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 47781, "caption": "A red and black bed with a comforter and a pillow is placed in a bedroom. A lamp is on the bedside, and there are various items such as books, a vase, and a plant on the bed. The room has a modern and clean design, and the furniture and decor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "vase", "bed", "tv", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 542792, "caption": "A large baseball bat stands in front of a building, while a baseball field is visible in the background. The building has a tall brick wall and a large window. The image captures the combination of a sports-related object and a cityscape, showcasing the contrast between the two environments.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": "A group of friends is enjoying a meal together at a table. They are sitting in a restaurant, and one of them is wearing a hat. They have ordered pizzas, and the man in the hat is holding a fork and knife, while the others are eating with their hands. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "bottle", "bowl", "dining table", "pizza", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5555555555555556}}, {"image_id": 318777, "caption": "A group of baseball players, including one man and a few women, is standing on a grass field, with one man in a blue jersey and the others in white. The scene is set in a stadium, with a large crowd watching from the stands.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 14773, "caption": "A colorful plate filled with a hot dog, fries, and a car on a dish sits on a table in a restaurant, capturing the attention of the diner.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "hot dog", "dining table", "bottle", "car", "cup", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 521863, "caption": "A young man, possibly a skateboarder, is performing a trick on a skateboard, while a crowd of people watches him in awe.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 250540, "caption": "In the image, several people are standing on the side of the road, with bicycles and motorcycles parked nearby.", "mscoco_hallucinated_words": [["bicycle", "bicycle"]], "mscoco_gt_words": ["cell phone", "motorcycle", "person", "car", "handbag"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 211604, "caption": "A young woman is lying on the floor in a park, wearing a tennis outfit and hat, and has a tennis racket beside her. She is taking a break from playing tennis, likely due to a break in the game or the sun. The image captures a moment of relaxation and leisure", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 298067, "caption": "The image shows a plate of pork chops and a bottle of beer on a table. The plate of pork chops is placed next to a glass of beer, making for a satisfying and enjoyable dining experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "bottle", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 563938, "caption": "A group of friends is sitting on a couch, using their tablets to play games or surf the internet. They are wearing casual attire and appear to be enjoying each other's company.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "tie", "bench", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 461311, "caption": "A group of people is gathered at a park, enjoying a day outdoors. They are watching a large kite flying in the sky, with people holding onto the kite strings. The image captures the joy and excitement of the group as they watch the kite soaring high above them.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "kite", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 47940, "caption": "A young woman is sitting on her bed with a small teddy bear and a pile of books. She is reading a book, and her teddy bear is resting on her lap. The bed is covered with a blanket and pillows, and the young woman is dressed in jeans. This image capt", "mscoco_hallucinated_words": [["teddy bear", "teddy bear"], ["teddy bear", "teddy bear"]], "mscoco_gt_words": ["laptop", "bed", "book", "person"], "hallucination_idxs": [11, 27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 261318, "caption": "A man is sitting on a chair in front of a bench, looking at his phone while waiting for someone. The bench is red and wooden, and there is a suitcase nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person", "suitcase", "handbag", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 134768, "caption": "A black computer mouse is sitting on top of a white desk, with a keyboard and a computer monitor nearby. The desk is located in a room with a window, giving it an interesting and visually appealing background. The overall setting is a dark and spacious room, with a keyboard, mouse,", "mscoco_hallucinated_words": [["monitor", "tv"]], "mscoco_gt_words": ["laptop", "mouse", "keyboard", "dining table"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 1.0}}, {"image_id": 526414, "caption": "A woman is sitting in a cozy room, surrounded by various household items and a sewing machine. She is sewing a piece of fabric, and there are several books and a TV in the room. The woman is working diligently, focusing on her sewing project. The room appears to be well", "mscoco_hallucinated_words": [["woman", "person"], ["woman", "person"]], "mscoco_gt_words": ["laptop", "cat", "dining table", "bowl", "scissors", "cup", "tv", "book", "remote", "couch"], "hallucination_idxs": [1, 40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 273132, "caption": "An elderly woman is sitting on a bench next to a suitcase, possibly waiting for a train or resting at the station. She wears a hat and carries a small bag, and there is a large suitcase by her side. The image captures a moment of the woman's life,", "mscoco_hallucinated_words": [["suitcase", "suitcase"], ["train", "train"], ["suitcase", "suitcase"]], "mscoco_gt_words": ["person", "handbag", "bench"], "hallucination_idxs": [11, 17, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": "A man is eating a hot dog while sitting on a bench, enjoying his meal in the cold weather.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "hot dog", "sandwich"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 192656, "caption": "A baseball player in a black and white uniform, wearing a white baseball cap, is holding a baseball glove and throwing the ball on a green field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 272728, "caption": "A beautiful bouquet of multi-colored flowers is placed in a vase on a wooden table, adding a touch of color and vibrancy to the dining area. The arrangement of flowers is displayed in a decorative vase, making it a visually appealing centerpiece. The combination of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "chair", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 509811, "caption": "A group of students are seated in a large, well-lit room with computers and a whiteboard. They are using their laptops and are likely taking a break from studying or working on a project together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "person", "dining table", "book", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 412407, "caption": "A woman is holding a cell phone, which has a small screen displaying a picture. She is sitting on a couch or bench in a dark room, possibly watching a video or taking a picture.", "mscoco_hallucinated_words": [["couch", "couch"], ["bench", "bench"]], "mscoco_gt_words": ["person", "cell phone", "clock"], "hallucination_idxs": [22, 24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": "A woman carries an umbrella while walking in a crowded market, surrounded by various items for sale, including fresh produce and other goods. The presence of the umbrella suggests that it may be raining or that the woman is protecting herself from the sun, while the market scene showcases the l", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "person", "suitcase", "umbrella", "carrot", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441363, "caption": "A man wearing red clothing and holding a tennis racket is swinging his arm and preparing to hit the ball while standing on the tennis court.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 331084, "caption": "A group of people is gathered around a table filled with pizza, vegetables, and utensils. They are preparing to enjoy a meal together, possibly a pizza party. The image captures a moment of interaction and collaboration, as they work together to prepare and serve their food. The presence of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bowl", "pizza", "knife", "spoon", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 282553, "caption": "A group of people is walking down a dirt path in the middle of a field. They are surrounded by tall standing stones, giving the area an ancient and mysterious feel. One person is holding a large yellow sign that says, \"Follow the Yellow Brick Road.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "cell phone"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 328818, "caption": "A young woman sits on a wooden bench in a park, putting on her socks. She is preparing to put on her shoes, possibly to go for a bike ride.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "bicycle", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 3103, "caption": "A man in a yellow helmet and a black and white jumpsuit is riding a skateboard on a half-pipe, performing a trick.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 188136, "caption": "A large kitchen with a stainless steel sink, a large refrigerator, and several pots and pans is filled with fresh fruits and vegetables. The image captures a bountiful and colorful arrangement of food items, showcasing the variety of ingredients that can be used", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["person", "sink", "dining table", "bowl", "carrot", "orange"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.16666666666666666}}, {"image_id": 449675, "caption": "A woman is eating a sandwich in a dining area, with a fork and knife on her plate. The sandwich is placed on a white plate, and she has a glass of water on the table next to her.", "mscoco_hallucinated_words": [["woman", "person"]], "mscoco_gt_words": ["fork", "sandwich", "dining table", "bottle", "knife", "cup", "spoon", "carrot"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 191691, "caption": "A man is applying shaving cream to his face in the bathroom. He is using a shaving kit that includes a bottle of shaving cream and a razor. He is standing in front of the sink and has a toothbrush in his hand, possibly for cleaning his teeth", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["person", "toothbrush", "bottle"], "hallucination_idxs": [37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 89378, "caption": "The image shows a man standing next to a red motorcycle on a cement floor, wearing a red and black motorcycle helmet and holding a red backpack.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "bicycle", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 99874, "caption": "A young woman sits at a table, wearing glasses and a black shirt, while she holds her cell phone to her ear. She is using the phone to make a call, possibly to discuss plans or engage in conversation with someone. The woman's surroundings suggest that she is in a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cat", "dining table", "bottle", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437895, "caption": "A colorful bed with a bed frame and a hammock is shown in the image. The hammock is hanging from the bed frame, creating a unique and eye-catching design. The bed itself is made up of several pillows and blankets, and there is a vase filled with flowers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "bed", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557447, "caption": "A man in a suit is sitting at a conference table with a notebook, pen, and a cup of coffee in front of him. He appears to be in a meeting or discussing business matters with others at the table.", "mscoco_hallucinated_words": [["notebook", "laptop"], ["cup", "cup"]], "mscoco_gt_words": ["fork", "person", "dining table", "knife", "spoon", "tie"], "hallucination_idxs": [13, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.3333333333333333}}, {"image_id": 159979, "caption": "A group of people can be seen sitting on a wooden boat, surrounded by various food items and a dining umbrella. This scene suggests that they might be enjoying a meal together or participating in a social event, possibly on a river or lake. The presence of the umbrella provides protection from", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "boat", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 357, "caption": "A group of baseball players is on the field, with a few players standing at the plate and others standing in the outfield. The image shows a close-up view of the batter's stance and the pitcher on the mound.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 538891, "caption": "A young woman in a white tennis outfit is standing at the baseline of a tennis court, holding a tennis racket and looking at the camera with a determined expression. She is preparing to hit a tennis ball during a match.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 561967, "caption": "A train is traveling down the tracks, with a long line of railroad cars behind it. The train has a freight car at the end, which is the last car in the train. The train is moving through a rural area, surrounded by trees and fields.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "A blue train carries passengers down a track, passing by a green train car in the foreground. The image captures the moment when the two trains are moving in opposite directions, creating a contrast of colors and a sense of movement in the scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 7125, "caption": "A group of people, including a man and a woman, are riding bicycles on a paved path near a river. The man is riding a black bicycle, while the woman is riding a red one. They are both wearing bicycle helmets, indicating their safety and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "bottle", "backpack", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 221350, "caption": "An elderly man is wearing a red tie with white hearts, holding a handwritten note in his hand. He is sitting in a chair, possibly in a room with a table. The man appears to be smiling, and the note may be related to a special occasion or a message of love.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "dining table", "tie", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 280930, "caption": "A young girl is standing in front of a counter, with a tray of baked goods on it. She is holding a spatula and smiling, possibly enjoying her baking experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "oven", "refrigerator", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 151081, "caption": "A small airplane is flying over a vast field with a long, open road and a fence running along the edge of the field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "airplane"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 122232, "caption": "A man is playing tennis on a grassy field, surrounded by tennis balls and a net.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 134223, "caption": "A delicious sandwich and various condiments are displayed on a white plate in a dining setting. The sandwich consists of a baguette filled with a tasty combination of meat, cheese, and vegetables. The plate also contains a bowl of fries, a side of ranch dress", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["sandwich", "sandwich"]], "mscoco_gt_words": ["broccoli", "hot dog", "dining table", "bowl"], "hallucination_idxs": [2, 18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.25}}, {"image_id": 198163, "caption": "A man is sitting at a small table, surrounded by various bowls filled with paint. He is engaged in painting, using a brush to create artwork. The bowls of paint are arranged in front of him, and the window in the background provides natural light for his artistic process.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 3742, "caption": "A bowl filled with apples sits on a dining table next to a window, surrounded by various fruits. A rose flower is also present on the table, adding a touch of color and beauty to the scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "vase", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 217593, "caption": "A young boy is standing in the middle of a grassy field, wearing a baseball uniform, glove, and holding a baseball bat. He is preparing to play baseball, and the image captures the moment before he swings the bat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "handbag", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 279078, "caption": "A young woman stands in front of a refrigerator filled with beer bottles, excitedly holding a bottle of beer as she poses for a photo.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "refrigerator", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": "A man in a black shirt and black shorts is playing tennis on a court with a net in the background. He is wearing tennis shoes and has a tennis racket in hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "tennis racket", "chair", "person", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 477016, "caption": "A mother and her daughter are looking at a display of food products in a kitchen, with a large picture of a pig on the wall. The mother is holding a baby, while the daughter is walking away from the display with a toy. They appear to be in a happy and playful mood, enjo", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sink", "potted plant", "oven", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 301266, "caption": "In the image, a group of people is gathered around a table, working together to prepare food for a meal. They are busy preparing various dishes, using utensils and tools, and possibly discussing the meal plans. The image captures the process of cooking and preparing food, show", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "sink", "dining table", "cup", "spoon", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 475813, "caption": "A young girl stands in a room, holding a toy television remote in one hand while she stares at the TV screen with her other hand. The image captures a moment of curiosity and attention from the young child as she watches something on the screen.", "mscoco_hallucinated_words": [["television", "tv"], ["tv", "tv"]], "mscoco_gt_words": ["person", "handbag", "remote"], "hallucination_idxs": [11, 21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 558784, "caption": "A man is standing by a small body of water, holding a golf club and looking at his phone. He is likely trying to check his golf score or make a plan for his next shot.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "backpack", "frisbee"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 308543, "caption": "A person is holding two silver spoons in their hand, with one of them dipped into a sink full of water. The person is possibly preparing a meal or cleaning a dish using the spoons.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sink", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 359164, "caption": "A pair of dogs, a golden retriever and a black and white dog, are seen playing in the grass. One of the dogs is running towards a small trash can in the grass.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "chair", "dog", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "A white and gray Lego kitchen with a stove, sink, and refrigerator is displayed in a colorful setting, showcasing the creativity and imagination of the Lego builder. The Lego kitchen is set up in a black and white checkered pattern, adding a unique touch to the overall", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "sink", "refrigerator", "clock"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 143479, "caption": "A man is holding a large tray filled with hot, spicy peppers, while an elderly woman is standing nearby. The man appears to be taking the peppers from the tray and handing them to the woman, who is likely his companion or someone he is assisting.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 475024, "caption": "A vase full of orange flowers, sitting on a table with a mirror behind it, is the main focus of this image. The arrangement of the flowers in the vase adds a pop of color and beauty to the room, while the mirror provides a nice backdrop to capture the image.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "dining table", "orange", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 238065, "caption": "A young man is riding a skateboard, performing tricks and posing for the camera on a wooden platform. The image captures the moment of his skateboarding skills, and the sunlight illuminates his face, creating a lively and energetic atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "A small bathroom is filled with various items, including a sink, a toilet, a book, a bottle of alcohol, and a mirror. The sink is being used for washing hands, while the toilet is being used for personal hygiene. The book appears to be a decor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "book", "bottle", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 322163, "caption": "A chef is busy preparing a meal at a pizza station in a restaurant, surrounded by other people. He is working on a dough, likely a pizza crust, and using a rolling pin to shape it. The chef is using a variety of ingredients, including a red sauce and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "person", "bottle", "bowl", "dining table", "pizza", "potted plant", "oven", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 230983, "caption": "In the image, a man is seen jumping on a skateboard, doing a trick on the sidewalk. He is wearing a red baseball cap and a black shirt, and the skateboard is yellow. The man is performing a flip, showcasing his skills and agility on the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "In the image, a kitchen with a large brown stove and a white refrigerator is visible, along with a countertop and a sink. The kitchen also features a microwave and an oven. The scene is set in a motorhome, which is a type of recreational vehicle designed for camp", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "sink", "microwave", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 53431, "caption": "A man is sitting on a chair in front of a brick wall, wearing a suit and tie, with his laptop open. He is using the chair as a makeshift desk to work on his computer.", "mscoco_hallucinated_words": [["tie", "tie"], ["desk", "dining table"]], "mscoco_gt_words": ["laptop", "person", "chair"], "hallucination_idxs": [18, 33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 1.0}}, {"image_id": 441840, "caption": "A young boy is practicing his baseball pitching skills in a field, using a baseball bat to throw the ball. He is surrounded by people, possibly his friends or family, who are watching him play. The image captures the moment of excitement and enjoyment as he takes a swing at the ball, demonstrating", "mscoco_hallucinated_words": [["ball", "sports ball"], ["ball", "sports ball"]], "mscoco_gt_words": ["person", "truck", "car", "baseball glove", "baseball bat"], "hallucination_idxs": [20, 56], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.4}}, {"image_id": 53465, "caption": "A group of people is enjoying a dessert at a table, with a cake that reads \"Welcome to the Jungle\" in frosting. The cake is decorated with edible flowers, and the group is drinking beverages and eating snacks while they celebrate their time", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "dining table", "bowl", "cup", "spoon", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 381031, "caption": "A caption for the image could be:\n\n\"A bowl of peanut butter and jelly sandwiches, a glass of orange juice, and a bowl of mixed berries are arranged on a dining table. The table is set with a spoon, a knife,", "mscoco_hallucinated_words": [["bowl", "bowl"], ["sandwich", "sandwich"], ["orange", "orange"], ["bowl", "bowl"], ["knife", "knife"]], "mscoco_gt_words": ["bottle", "dining table", "cup", "spoon", "donut", "microwave", "apple"], "hallucination_idxs": [10, 16, 21, 26, 46], "metrics": {"CHAIRs": 1, "CHAIRi": 0.625, "Recall": 0.2857142857142857}}, {"image_id": 530520, "caption": "Two friends, one with a laptop and the other with a backpack, sit on the grass in a park, engaged in a conversation or working on a task. The scene suggests that they might be discussing a project or sharing information related to their studies or work.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "clock", "motorcycle", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 539555, "caption": "A young man is playing a game of volleyball, using his hands to hit the ball while wearing a t-shirt and shorts. He is surrounded by other people, which suggests that this is a group activity.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "skateboard", "frisbee"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 279521, "caption": "A man and a woman are standing next to a city bus, looking at their phones. The woman is wearing a blue jacket, and the man is wearing a red hat. They seem to be discussing something while waiting for the bus to continue its route.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bus", "person", "train", "car", "handbag", "backpack"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.16666666666666666}}, {"image_id": 560439, "caption": "In the image, a group of people are walking along a snowy trail, likely enjoying winter sports. They are dressed in warm clothing, including coats, hats, and gloves, and are carrying skis, snowboards, and bags. The group is standing on a snow-covered", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "snowboard", "handbag", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 248353, "caption": "A group of young skiers, including a young girl and two boys, are having fun on a snow-covered slope, enjoying their winter sport. They are all wearing winter clothing and skiing equipment, such as skis, snowboards, and helmets, to keep warm and safe while", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 9628, "caption": "A man is riding a red kayak, standing up and balancing himself on the water. He is holding onto a surfboard and appears to be performing a trick while doing so.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 330050, "caption": "A man and a woman are standing in a tennis court, holding a tennis racket and a tennis ball. The woman is smiling, while the man is holding the racket in a more serious posture. They might be participating in a friendly game of tennis or just enjoying the sport together.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["tennis racket", "person", "bench"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 254161, "caption": "A person is walking through a city square surrounded by tall buildings, while holding a smartphone and looking up at the sky.", "mscoco_hallucinated_words": [["smartphone", "cell phone"]], "mscoco_gt_words": ["person", "kite", "handbag"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 275749, "caption": "A group of friends is gathered in a room, with one person sitting at a computer desk and others standing around. They are likely engaged in a video game or sharing a meal, as there is a bottle of beer on the desk. They are laughing and having fun together, creating a l", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "mouse", "person", "dining table", "bottle", "cup", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 163518, "caption": "A woman in a chef uniform is placing a large serving of salad into a container, possibly for a catering event. The salad is made up of various vegetables, such as lettuce, tomatoes, and carrots, arranged in a neat and organized manner. The woman is diligently", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["chair", "person", "dining table", "bowl", "oven"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 156696, "caption": "A long train with several cars, including one with a passenger inside, is moving down the tracks, and people are standing on the platform.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "handbag", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 525202, "caption": "A group of friends are enjoying a delicious pizza at a restaurant, sitting around a table with a large pizza in the center. The pizza is topped with a variety of ingredients, including meat, vegetables, and cheese, making it a satisfying and flavorful meal for", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "bottle", "dining table", "pizza", "knife", "cup", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 423984, "caption": "A delicious and hearty meal is displayed on a white plate. A bowl of creamy pasta is placed in the center of the plate, surrounded by a variety of vegetables, including broccoli, carrots, and celery. The meal is accompanied by a slice of bread and", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 499486, "caption": "Two cats, a black and white cat, and a brown cat, are sitting on a bed together. The black and white cat is on the pillow, while the brown cat is laying on top of the bed, and both cats appear to be sleeping.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bed", "book", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": "A young man is sitting in a car, looking at the camera while wearing a tie and a pair of glasses.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 288729, "caption": "A cute and colorful cake with a circus theme sits on a table next to a stuffed animal and a stuffed elephant. The cake features a small circus tent with a smiling face on top, surrounded by balloons and a clown. The cake is", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["elephant", "person", "bear", "teddy bear", "cake"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 177721, "caption": "A young man is skateboarding on a half-pipe at an outdoor skate park. He is performing tricks and showing off his skills, enjoying the thrill of riding his skateboard.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skateboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": "A man wearing a white robe and a hat is holding a mobile phone in his hand, possibly taking a photo or using it to communicate. He is standing in front of a crowd of people, possibly at a festival or event, and is surrounded by a group of people who are watching him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "cell phone", "horse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 252625, "caption": "A busy street in Tokyo, Japan, features a bicycle lane, a sidewalk, and a variety of shops, including a convenience store and a vending machine.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "traffic light", "person", "bicycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 493610, "caption": "A bus is parked on a dirt road, with people riding on the roof and inside the vehicle. The bus is traveling through a rural area, and there is a person standing next to the bus.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 302789, "caption": "A suitcase and a backpack are placed on a bed in a room, with a laptop bag and a suitcase open on the floor next to the bed. A small table with a laptop and a bottle of water is also present in the room. The image suggests that someone may have recently returned from a trip", "mscoco_hallucinated_words": [["laptop", "laptop"], ["table", "dining table"], ["laptop", "laptop"]], "mscoco_gt_words": ["suitcase", "sink", "bottle", "bed", "handbag", "backpack", "refrigerator"], "hallucination_idxs": [16, 32, 35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5714285714285714}}, {"image_id": 30667, "caption": "A couple is sitting on a boat, reading a book together, while a brown dog is lying on the floor next to them.", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 114108, "caption": "In the image, a group of people is gathered around a large pizza on a table. The pizza is divided into several slices, and a fork and knife are placed on top of it. A person is holding a fork and taking a bite of the pizza, while another person is reaching for", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "dining table", "pizza", "knife", "cup", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.625}}, {"image_id": 328110, "caption": "A young woman is sitting on a bench, holding her baby while looking at her phone. The baby is wearing a red hat, and the woman is wearing a white t-shirt. The image captures the moment of her attention being focused on her phone, while the baby is safely held in her", "mscoco_hallucinated_words": [["phone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["person", "handbag", "bench", "backpack"], "hallucination_idxs": [16, 47], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 366111, "caption": "A man rides a bicycle while a woman sits on a bike, both of them wearing suits, as they travel through a busy street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "bicycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 532481, "caption": "A man is flying a kite on a beach with a surfer riding a wave in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "kite", "surfboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 291634, "caption": "The image features a street lined with multiple motorcycles parked along the sidewalk. There are bikes of various sizes, shapes, and colors, indicating a diverse range of motorcycles. The scene suggests a vibrant and bustling atmosphere, with a mix of new and old bikes l", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 463678, "caption": "A man is holding a tennis racket and wearing white tennis attire while standing in front of a blue tennis court. He is about to hit a tennis ball with his racket. The image captures a moment of focus and concentration, as the man prepares to strike the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 70815, "caption": "A dog is sitting on a sidewalk, possibly waiting for its owner to return. The dog is wearing a coat, and the scene is captured in black and white.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "bicycle", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 367872, "caption": "A baseball player is swinging a bat at a baseball, with a large crowd watching in the stands.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "umbrella", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 353898, "caption": "A young man is sitting on a stone bench surrounded by a flock of white birds in a park, engaging in a leisurely activity with his friends. The image captures a serene and peaceful scene, showcasing the beauty of nature and the joy of spending time with loved ones", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "bench", "bird", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 88269, "caption": "A delicious bowl of soup sits on a plate, accompanied by a slice of toast and a spoon.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sandwich", "spoon", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 463211, "caption": "A young girl and her friend are standing next to a school bus, both wearing school uniforms. The girl is holding a pink backpack and has her hair tied in a ponytail. The friend, a boy, is standing next to her, and they seem to be waiting for the bus to arrive", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "In the image, a large bouquet of colorful flowers sits on a gold chair in a room with a beautiful floral design on the walls.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 98979, "caption": "A black microwave oven sits on a kitchen counter, surrounded by a stove and a dishwasher.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "knife", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 244455, "caption": "A group of police officers on motorcycles are riding down a city street, with one officer waving and pointing at the camera. The image captures the camaraderie and professionalism of the officers as they patrol the city, ensuring the safety and security of the community.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": "A person is sitting on a couch, surrounded by various objects like scissors, a black dress, and an orange pair of scissors.", "mscoco_hallucinated_words": [["person", "person"], ["couch", "couch"]], "mscoco_gt_words": ["orange", "dining table", "scissors"], "hallucination_idxs": [1, 6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 536154, "caption": "A young girl is sitting on a bed surrounded by a large collection of stuffed animals, toys, and other plush items. The girl is holding up a teddy bear and smiling, showcasing her excitement and love for these cuddly companions. The image captures a moment of joy", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["person", "teddy bear", "cat"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 374061, "caption": "A black cat is sleeping on a couch, with a teddy bear on its side, and a small stuffed animal in its mouth.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "bed", "bear", "teddy bear", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 560018, "caption": "A group of people are surfing in the ocean, riding the waves and enjoying the sunny day. They are located near a pier, with the pier's wooden structure visible behind them. The image captures the activity and joy of the surfers, who are engaged in their sport while enjoying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "kite", "surfboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 353320, "caption": "A man is sitting on a bench in front of a train station, holding a suitcase and looking at his phone. The suitcase is on the bench beside him, and a guitar case is on the bench behind him.", "mscoco_hallucinated_words": [["train", "train"], ["phone", "cell phone"]], "mscoco_gt_words": ["suitcase", "person", "handbag", "bench"], "hallucination_idxs": [11, 21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 256628, "caption": "A golden retriever is lying down on the wooden floor, with its head resting on its paws, looking at the camera. The dog appears to be enjoying the sunny day and is probably waiting for its owner or someone to come and play with it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dog", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": "A cute dog is enjoying a tasty peanut butter and jelly sandwich on a blue plate, and it's being held by a person.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sandwich", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 424270, "caption": "A young girl is lying on a bed or a mattress, surrounded by a pile of bedding, in a room with a window.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bed", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": "A horse stands next to a line of parked cars, looking at the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "car", "horse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 483227, "caption": "A group of children is gathered around a tennis net, playing tennis with rackets and balls. They are engaged in a fun and active activity, enjoying the sunny weather and fresh air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 228306, "caption": "A red double-decker bus is parked at a curb on a city street, with people walking past it. The bus is a classic London-style double-decker, which adds to its appeal and charm.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 416384, "caption": "A young woman sits on a wooden bench, holding her phone, and enjoying the sunshine. She is wearing a pink swimsuit and has a towel on her lap. The scene captures the woman's relaxed mood and the beautiful outdoor environment, showcasing", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "chair", "cell phone"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 364783, "caption": "A close-up image of a small bathroom with a red sink, toilet, and bathtub, as well as a red-colored shower curtain. The bathroom is clean and well-maintained, with a shiny surface on the shower floor and a potted plant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "sink", "toothbrush", "bottle", "cup", "toilet", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 335041, "caption": "A man and a woman are walking down a snowy street with snow-covered cars parked along the side. They are each carrying a pair of skis and appear to be enjoying their winter outdoor activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 531327, "caption": "A bowl filled with a colorful vegetable salad, including broccoli, carrots, and peppers, is sitting on a dining table in a restaurant. The vegetables are arranged neatly and look appetizing. The dining table also has a glass of red wine nearby, adding", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "broccoli", "knife", "spoon", "wine glass", "carrot"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.42857142857142855}}, {"image_id": 451228, "caption": "A group of people riding bicycles and walking on the sidewalk, along with several red double-decker buses, is seen on a busy street in the city at night.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "bus", "bicycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 256365, "caption": "A white plate is filled with three blue cupcakes, each topped with a swirl of frosting. The cupcakes are arranged on a plate, and the plate is placed on a white table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "cup", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 502936, "caption": "A man is playing tennis on a tennis court, with a racket and a tennis ball in hand. He is wearing tennis clothing and is in the process of hitting a tennis ball back and forth with his opponent. The image shows the man's focus on the game, and the presence of the ra", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451449, "caption": "A dog is sleeping in a bed inside a bookshelf, surrounded by books and other items.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bed", "book", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 51054, "caption": "An elderly woman sits on a bed, holding a cell phone while looking at it intently. The image captures a moment of her daily life, possibly related to her communication with someone or a task she needs to complete.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "bottle", "bed", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 1268, "caption": "A man and a woman are sitting on a stone bench, enjoying a sunny day and the beautiful view of the river. The man is taking a picture of the swan, while the woman is smiling and looking at the camera. The image captures the serene and picturesque atmosphere of the city", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["cell phone", "person", "bird", "handbag", "backpack", "boat"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 62692, "caption": "A woman in a black and white outfit is playing tennis on a tennis court. She is in the middle of a serve, as she swings her tennis racket with a ball overhead.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542771, "caption": "A woman sits at a wooden desk in a dimly lit room with a chair, a small table, and a vase of flowers. She is holding a book in her hands and appears to be reading it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "dining table", "vase", "potted plant", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 575406, "caption": "A bright red and blue bus is parked on the sidewalk in front of a building, with a small red car nearby. The bus is decorated with colorful stripes, adding a vibrant touch to the scene.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["potted plant", "person", "bus", "motorcycle"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 244834, "caption": "A man and woman walk together on a sidewalk under an umbrella, holding hands and walking in the rain.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "bicycle", "person", "umbrella", "car", "potted plant", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 151159, "caption": "A man is playing skateboard with a group of friends on a concrete tennis court. They are enjoying the activity and having fun together, with the man performing a trick on the skateboard.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277073, "caption": "A man riding a motorcycle on a busy street, surrounded by cars and pedestrians, is captured in the image. The man is wearing a helmet and is driving the motorcycle with a sense of confidence and determination, while the other vehicles and pedestrians continue their daily activities around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person", "car", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 377879, "caption": "A large army tank sits on a truck bed, being transported through a city street. The tank is surrounded by a metal fence and is parked on a rail track.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "truck", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 436814, "caption": "A young woman is sitting at a desk in a small, well-lit room. She is using a laptop and a cell phone, with a pile of papers and other documents on her desk. There is a bookshelf behind her, and a window visible in the background. The room appears to be", "mscoco_hallucinated_words": [["woman", "person"], ["cell phone", "cell phone"]], "mscoco_gt_words": ["laptop", "chair", "mouse", "dining table"], "hallucination_idxs": [2, 22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 63934, "caption": "A man rides a skateboard down the sidewalk in front of a city building, wearing a white nun costume.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "skateboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 275611, "caption": "A close-up image of a pizza sitting on a plate, with a fork and knife on the side, is displayed in the image. The pizza has a white sauce, and it is topped with cheese, green peppers, and onions. It is being served on a white table", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["pizza", "knife", "dining table"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 516248, "caption": "A person is sitting at a computer desk with a keyboard, mouse, and a laptop. The person is typing on the keyboard and using the mouse to navigate through a computer program or website. The image shows a person using a computer for work or leisure activities, such as browsing the internet or working on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "person", "keyboard", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 478380, "caption": "A large group of sheep are gathered on a road in front of a bus, creating a traffic jam. A man is standing on the bus, observing the situation.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "sheep"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 422326, "caption": "A man is standing next to a motorcycle, while a couple of motorcycles are parked next to each other. One of the motorcycles is a chopper, and the other one is a sidecar. They are parked in a parking lot, and there is a person standing next to them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 110449, "caption": "Two men, one wearing a hat and the other wearing a baseball cap, are standing at a bar counter, looking at a computer screen and a DJ mixing music. They are both involved in a night out, possibly at a party or a club.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "person", "dining table", "tv", "remote"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 45550, "caption": "In the image, a man is holding a plate with a large piece of fried chicken on it, smiling for the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sandwich", "clock", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 444913, "caption": "A man is standing in a grassy area, holding a baseball bat and looking up at the sky, possibly while waiting for a pitch. He is wearing a baseball cap, and the image captures the moment of him being ready to swing at the ball. The man is situated near a building, adding context to", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"], ["ball", "sports ball"]], "mscoco_gt_words": ["person", "car", "frisbee"], "hallucination_idxs": [11, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 82709, "caption": "A dog is jumping over a fence while a girl is holding a frisbee in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "cup", "backpack", "dog", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 132796, "caption": "A group of people, including a man and a woman, are riding an elephant through the forest, with a person sitting on the elephant's back.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "chair", "person", "bench", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 303099, "caption": "Two cats sit on top of a toilet, looking at a bathroom sink, and a toilet paper roll.", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["toilet", "cat", "bottle"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "A group of motorcyclists is riding down a city street, passing by a parked car on the side of the road. The motorcyclists appear to be enjoying a fun and adventurous ride together, with one of them holding a flag. The parked car serves as a backdrop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 205193, "caption": "A person is sitting on a kitchen counter next to a cup of tea and a tea bag. The person is holding a spoon and looking at the tea bag in their hand.", "mscoco_hallucinated_words": [["cup", "cup"], ["spoon", "spoon"]], "mscoco_gt_words": ["person", "oven", "toaster", "microwave"], "hallucination_idxs": [11, 24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 272566, "caption": "A man sitting on a bench is surrounded by a variety of fruits, including bananas, apples, and oranges. He is enjoying a snack while sitting in a park, likely enjoying the freshness of the fruits and the pleasant atmosphere of the park.", "mscoco_hallucinated_words": [["bench", "bench"], ["orange", "orange"]], "mscoco_gt_words": ["person", "banana", "cup", "apple"], "hallucination_idxs": [5, 20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.75}}, {"image_id": 170099, "caption": "In this image, a man stands in front of a couch with orange cushions, while holding a framed photograph of an apartment building. The man is wearing a suit, and the scene appears to be a living room or a conference room. The presence of the couch, the man, and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "couch", "orange", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 14940, "caption": "A large orange cat is sitting on a bed, holding a stuffed animal in its paws, and looking at the camera.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["chair", "orange", "cat", "couch", "dog"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 408449, "caption": "A young man skateboards down a city street, holding his skateboard while walking, and wearing a white shirt.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "truck", "skateboard", "car", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 140702, "caption": "A baby elephant and its mother walk together in a field, with the baby elephant being led by its mother.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "elephant", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 354540, "caption": "A man is sitting on a kitchen counter with a laptop and a few cables hanging from the counter, which suggests that he is working on something.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "toaster", "chair", "cell phone", "person", "oven", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 19763, "caption": "A man is enjoying a slice of pizza, with a glass of beer on the table next to it, while sitting at a table in a restaurant.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "chair", "person", "dining table", "pizza", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 191301, "caption": "A close-up image of a dessert tray showcases a delicious treat, including chocolate cake and ice cream. The tray is placed on a white tablecloth, and there are various utensils, such as spoons and forks, to enjoy the dessert. The", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["person", "dining table", "cup", "spoon", "cake"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 124236, "caption": "A busy kitchen is filled with various items, including a stove, sink, dishwasher, refrigerator, and microwave. A kitchen table is present, as well as a small dining table with chairs. There are pots, pans, and utensils on the", "mscoco_hallucinated_words": [["sink", "sink"], ["refrigerator", "refrigerator"], ["microwave", "microwave"], ["chair", "chair"]], "mscoco_gt_words": ["toaster", "dining table", "bowl", "spoon", "oven"], "hallucination_idxs": [13, 17, 20, 36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5714285714285714, "Recall": 0.4}}, {"image_id": 344930, "caption": "A red fire hydrant stands on a sidewalk next to a car, and a parked car is visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "car", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 14285, "caption": "A cat lays on a bed in a room with a TV and a computer. The cat is likely sleeping, and the room has a TV and a computer, which suggests that the owner is using the devices for entertainment or work.", "mscoco_hallucinated_words": [["computer", "laptop"], ["computer", "laptop"]], "mscoco_gt_words": ["chair", "cat", "bed", "tv", "book", "remote"], "hallucination_idxs": [14, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.5}}, {"image_id": 82488, "caption": "A bed or beds, with multiple pillows and a clock, are arranged in a room, possibly a hotel or bed and breakfast. The bedding appears to be colorful and comfortable, adding to the inviting atmosphere of the space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "dining table", "bed", "book", "remote", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 348251, "caption": "A woman wearing a green jacket and a backpack is walking down a snow-covered slope with skis on her feet. She is walking on a ski trail, likely enjoying a day at the ski resort.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 150703, "caption": "A glass of beer and a hot dog sit on a table, with a plate of food and a napkin nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "sandwich", "cup", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 381615, "caption": "A woman sits in a dining room, surrounded by plants and a window, with a chair next to a table.", "mscoco_hallucinated_words": [["woman", "person"], ["table", "dining table"]], "mscoco_gt_words": ["chair", "vase", "cup", "potted plant", "book"], "hallucination_idxs": [1, 21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.2}}, {"image_id": 352703, "caption": "A woman is preparing food at an outdoor event, using a large blue bowl, a spoon, and a wooden cutting board. She is stirring and mixing the ingredients in the bowl. The scene is taking place at a picnic table in a park, where people are gathered to enjoy", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "bowl", "cup", "spoon", "oven", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 111109, "caption": "A young boy is sitting on a chair, wearing shorts and a white shirt. He is smiling and looking directly at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "motorcycle", "person", "tie", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": "A crowded street scene with people walking and vehicles passing by, including a red bus, cars, and a taxi. The scene takes place on a wet pavement, and there are buildings and a hotel visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 49005, "caption": "In the image, a baseball game is taking place on a large field, with several players engaged in the action. The game is being played on a grassy field, and the players are dressed in baseball uniforms. One player is holding a baseball bat, while another is preparing to pitch the ball. The field", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "baseball glove", "baseball bat"], "hallucination_idxs": [57], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 410114, "caption": "In the image, a group of cows is walking down a dirt road, possibly grazing in the fields. The cows are surrounded by a fence, and the dirt road can be seen in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cow", "truck", "horse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 100274, "caption": "A train is parked on a platform next to a railroad track in a city, surrounded by buildings and a street. The train is near a large industrial building, and there are other vehicles nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 317254, "caption": "A young man on a motorcycle rides down the street, passing by parked cars, while a city street is visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425569, "caption": "A chef is preparing a meal in a kitchen, with multiple pots, pans, utensils, and food items on the stovetop. The chef is using a stainless steel bowl to prepare a dish.", "mscoco_hallucinated_words": [["chef", "person"], ["chef", "person"]], "mscoco_gt_words": ["oven", "sink", "bowl"], "hallucination_idxs": [1, 26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 28842, "caption": "A man is riding a skateboard down a grassy hill, enjoying the outdoors and the thrill of the ride. He is wearing a helmet and has a grin on his face, indicating that he is having a good time. The image captures the excitement and fun of sk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skateboard", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 319607, "caption": "A man rides his bicycle down the street in front of a building with a traffic light at an intersection. The traffic light is red, indicating that the road is currently closed to vehicular traffic. The man is dressed in a black and white striped shirt, which adds to the overall vibrant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bicycle", "person", "car", "traffic light", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 210372, "caption": "A close-up image of a red kitchen with a sink, refrigerator, and a table in the foreground.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["sink", "refrigerator", "bottle"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 156915, "caption": "A beautiful bouquet of red roses is placed on a wooden table, surrounded by greenery and a glass vase. The arrangement adds a touch of elegance and beauty to the room, creating a welcoming atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 349642, "caption": "A man sits on a bench, looking at his dog that is sitting on the ground next to him. The man is dressed in a black coat, and the dog is a small brown dog. They are sitting together on the sidewalk in front of a brick building.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": "A bustling market scene in a small town or village is captured in this image. A group of people are gathered near the water, with boats, fishing gear, and various colorful umbrellas visible. The scene is likely filled with the sounds of vendors calling out their wares and customers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "suitcase", "umbrella", "handbag", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 45435, "caption": "A hand holding a smartphone is shown, with the device's screen displaying the image of a person holding a white smartphone.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cup", "person", "cell phone"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": "In the image, a man is sitting at a desk in a room, surrounded by various electronic devices and papers. He is working on a computer, possibly on a project or typing an email. The room is well-lit and appears to be organized, with the man sitting in front of a white desk and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "person", "bottle", "dining table", "cup", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 72656, "caption": "Three children are sitting at a wooden table on a wooden deck, enjoying their lunches together. They are eating pizza and playing with toys, having a fun time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "suitcase", "dining table", "bowl", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 372087, "caption": "A green train with a large number of passengers pulls into the station, with a person standing at the edge of the platform.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["suitcase", "train", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 336209, "caption": "A young man is riding a skateboard in an abandoned warehouse, jumping and performing tricks on the ramps. He is wearing a shirt and jeans, and the image captures the excitement and energy of his skateboarding skills.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 46031, "caption": "A laptop, a mouse, and a keyboard are sitting on a table next to a window. A mousepad and a keyboard are also present. The table has a green and brown pattern on it, and there are some plants nearby. The laptop and keyboard are likely being used for various tasks or activities, such as brow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "cell phone", "keyboard", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 283118, "caption": "A family is enjoying a meal together at a restaurant, with the children sitting in chairs and the mother and father sitting at the table. They are all smiling and engaged in conversation, and there is a bottle of water and a plate of food in front of them. The children are likely enjoying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person", "bottle", "dining table", "pizza", "car", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 429598, "caption": "A wooden kitchen with an old-fashioned stove and refrigerator sits in a room with a brick wall. The kitchen features a wooden table with chairs, and a wooden countertop, giving it a rustic and cozy appearance. The presence of a stove and refrigerator", "mscoco_hallucinated_words": [["table", "dining table"], ["chair", "chair"]], "mscoco_gt_words": ["oven", "sink", "refrigerator", "bottle"], "hallucination_idxs": [23, 25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 333365, "caption": "A large red airplane sits on a tarmac next to a smaller white airplane, both parked at an airport. The image captures the bustling atmosphere of an airport, with multiple planes on the runway and passengers walking in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "airplane"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 424174, "caption": "A colorful and lively bowl of fruit is displayed on a wooden table, showcasing a variety of fruits like apples, bananas, and oranges. The fruit bowl is full of fresh and healthy options for snacking or adding to a meal, making it a delightful", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "dining table", "bowl", "orange", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 3035, "caption": "A plane sits on the tarmac at an airport, surrounded by a few other airplanes and a large airport building. The image captures the various aircraft parked together, waiting to be used for flights. The scene showcases the bustling atmosphere of an airport, with multiple", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "airplane"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 177213, "caption": "A person is eating pizza, which is a popular Italian dish made with dough, cheese, and sauce. The person is sitting at a table, enjoying their meal. The pizza is placed on a white plate, and a knife is used to cut it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "dining table", "pizza", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 438535, "caption": "A large clock stands in the middle of a busy street, surrounded by tall buildings and a cityscape. The clock is a classic design with a white face and a black hand, indicating the time.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "backpack", "clock"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 490711, "caption": "In this image, we see a white kitchen appliance, likely a refrigerator, sitting in a kitchen with a countertop and cabinets. The refrigerator is surrounded by other kitchen items, such as a sink and a stove. There is also a microwave on the countertop.", "mscoco_hallucinated_words": [["stove", "oven"], ["microwave", "microwave"]], "mscoco_gt_words": ["sink", "refrigerator", "banana"], "hallucination_idxs": [40, 46], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 163728, "caption": "A white cat is lying on a desk, with its paws resting on a small mouse toy. The cat is sleeping while holding the mouse toy, and it is a cute scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "mouse", "cat", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 456756, "caption": "A large giraffe stands in a zoo, looking at the camera with its long neck and legs. It is surrounded by other animals, such as a zebra and a lion. The image captures the giraffe's unique appearance and the variety of animals present in the zoo.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "zebra", "giraffe"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 281028, "caption": "A passenger train with a large window is sitting at a station, with two chairs facing the window. The passenger train is decorated with a red and white color scheme, and there is a large American flag on the side of the train. The image captures a moment of the train's arrival at the station", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 343937, "caption": "A woman is riding a snowboard down a snow-covered slope, wearing a black snowboarding helmet, a black jacket, and a white hat. She is standing on a snowboard, balancing on the edge of the snowboard with her skis, enjoying the thrill of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 277051, "caption": "Two birds perched on a table next to a dish of food, looking at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "bottle", "bird", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 145666, "caption": "A bowl full of fresh broccoli and carrots sits on a stainless steel countertop, waiting to be cooked and enjoyed. The vegetables are colorful and fresh, and the bowl is clean and ready for use.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 304984, "caption": "A delicious sandwich with a plate of sliced oranges and a fork rests on a table, with a glass of chocolate milk next to it. The sandwich is made with a crispy, golden-brown bread, and it is likely filled with meat, cheese, or", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["fork", "sandwich", "bowl", "wine glass", "cake", "orange"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 122467, "caption": "The image shows a hand holding a white Nintendo Game Boy Advance (GBA) controller, with a red circle around it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "remote", "couch", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 518287, "caption": "A toothbrush with a smiling face is sitting on top of a tube of toothpaste on a bright orange background. The toothbrush appears to be enjoying the toothpaste, as if it is about to brush its teeth.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["toothbrush", "orange", "cup", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 145448, "caption": "A cat sits on the back of a motorcycle, while a group of people sit around the table, enjoying a meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "motorcycle", "person", "cat", "dining table", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 352900, "caption": "A delicious, creamy pasta dish with broccoli and a fork is served on a white plate, ready to be enjoyed by someone.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["broccoli", "fork", "knife", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 153607, "caption": "A blue vase with a flower placed in it is sitting on a table next to a blue bowl and a blue cup. The image is a beautiful display of colorful decoration, adding a touch of elegance and sophistication to the room.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["orange", "vase", "dining table", "bowl"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 157581, "caption": "A caption for the image could be: \"A group of wine glasses, bottles, and a wine bottle sitting on a table, with a white background and a silver tablecloth. The wine glasses are arranged in a neat and tidy manner, and the bottles are placed on top of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "bottle", "dining table", "cup", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227438, "caption": "A luxurious hotel room is shown in the image, with a large bed and a comfortable couch. There is a table and a lamp in the room, as well as a couple of chairs. The bed has a white cover, and the couch is covered in a patterned fabric. A large window", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bed", "chair", "clock", "couch"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.75}}, {"image_id": 116037, "caption": "A young girl is playing softball, swinging a bat and running towards home plate. She is wearing a baseball cap and a glove, and is surrounded by other players in the field. The image captures the excitement and energy of the game, showcasing the young girl's passion for softball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 202658, "caption": "A small pink toilet is sitting in front of a blue toilet seat, and it appears to be covered with a pink toilet seat cover. The image shows the two toilets sitting side by side, with one being a blue toilet and the other being a pink to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "toilet", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 18150, "caption": "A young boy is sitting on a bed while eating a pizza, and a man is sitting on the floor next to him. The boy is holding a pizza box and the man is holding a pizza slice, both of which are eating pizza together.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["person", "bottle", "pizza", "backpack", "couch"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.4}}, {"image_id": 418711, "caption": "In the image, a man is riding a bicycle while holding a large basket full of bananas, likely being sold at a market or street stand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "bicycle", "person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 92107, "caption": "A bowl of creamy broccoli soup, served with a spoon, sits on a table next to a slice of bread, ready to be enjoyed. The soup is made with corn, and it's a healthy and delicious meal option.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "broccoli", "spoon", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 491000, "caption": "A man walks down a cobblestone street in a historic city, passing by a group of people and a bicycle. The street is lined with colorful buildings and has a unique architecture that reflects the city's rich history. The presence of a bicycle indicates that the area may", "mscoco_hallucinated_words": [["bicycle", "bicycle"], ["bicycle", "bicycle"]], "mscoco_gt_words": ["motorcycle", "person", "car", "handbag", "dog"], "hallucination_idxs": [20, 46], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 401163, "caption": "A man and his dog sit on a bench in a park, enjoying the fresh air and the sunshine. The man has his arms around the dog, while the dog is lying down next to him. They appear to be taking a break and spending quality time together, away from the hustle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 39663, "caption": "A backpack full of various items is sitting on a floor in the image. The items include a laptop, a notebook, a pink pen, a pair of scissors, a book, and a black pen. These items are likely used for educational or work-related purposes, such as writing, research", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "cell phone", "scissors", "book", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 268293, "caption": "A young man is playing tennis on a sunny day, using his racket to hit a tennis ball. He is wearing a blue shirt and white pants, and his headband helps him keep his hair out of his face while he plays.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "In the image, a kitchen is full of various utensils, appliances, and food. A stove, a dishwasher, and a refrigerator are some of the appliances found in the kitchen. Additionally, there are numerous bottles, jars, and other containers", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"], ["container", "bowl"]], "mscoco_gt_words": ["clock", "sink", "bottle", "vase", "spoon", "oven", "apple"], "hallucination_idxs": [25, 47], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2857142857142857}}, {"image_id": 358086, "caption": "A group of young girls are playing a game of soccer at an indoor field, with one girl in a blue shirt and black shorts jumping up in the air to head the ball.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["chair", "person", "bottle", "backpack", "frisbee"], "hallucination_idxs": [34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2}}, {"image_id": 89541, "caption": "A yellow plastic container filled with various sweet treats sits on a table. It contains a cake, a slice of pound cake, a piece of strawberry shortcake, and a variety of fruits such as strawberries and blueberries.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "cake", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 239445, "caption": "The man in the image is holding a frisbee and smiling, ready to play with someone. He is wearing a white t-shirt and has a positive attitude, indicating that he is eager to engage in a fun activity with his friend or partner. The presence of a white plate on the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "A young kangaroo is standing on a grassy field, holding a red and yellow toy car in its paws. It appears to be having fun and playing with the toy car.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["kite", "car", "cat", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 487990, "caption": "A group of friends is enjoying a picnic together, with a variety of food items, including sandwiches, cookies, and a pink cupcake. One of the friends is using a small, handheld guitar to play music while they eat and socialize. This image captures a fun and", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["fork", "person", "bottle", "bowl", "dining table", "knife", "cup", "spoon", "donut", "cake"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.1}}, {"image_id": 138834, "caption": "A man is walking down a snowy road with skis on his feet.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 492057, "caption": "A man, possibly in his mid-20s, is captured in a mirrored wall of a public restroom. He is standing in front of the mirror, holding a phone, and taking a selfie.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388215, "caption": "A man is playing tennis at a court, with a ball flying over his head and a tennis racket in hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 111409, "caption": "The image features a man riding a motorcycle down a slope, with a puddle of water on the ground. The man is wearing a helmet, which is essential for safety while riding a motorcycle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451391, "caption": "A man is holding a bunch of broccoli in a green grocery store, showcasing a colorful and healthy vegetable option.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 92462, "caption": "A group of cows and a car are walking down a narrow street, possibly in a village or town, with the car passing by the cows. The cows are moving in a line, likely in a group or herd, and the car is driving past them. The scene could be a typical sight in", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cow", "car", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 397268, "caption": "A small, charming bike shop with a bicycle hanging from the ceiling and a bicycle parked in front. The shop is surrounded by greenery and a small table with a chair and a red couch outside. The bike shop has a cozy atmosphere, which might appeal to", "mscoco_hallucinated_words": [["table", "dining table"], ["couch", "couch"]], "mscoco_gt_words": ["potted plant", "bench", "chair", "bicycle"], "hallucination_idxs": [29, 36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.5}}, {"image_id": 127659, "caption": "A man is standing on a train platform, looking at his phone. A train is parked at the station, and the man is waiting for it to depart. The image captures a moment of the man's daily commute, where he is checking his phone for updates or notifications while waiting for the train to", "mscoco_hallucinated_words": [["phone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["person", "train", "bench", "dog"], "hallucination_idxs": [12, 49], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 251857, "caption": "A man is skateboarding on a sidewalk in front of a city park, while a young man is riding a skateboard in the background. The skateboarders are enjoying their time outdoors and engaging in the sport they love, while the city park provides a beautiful and v", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "skateboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 243212, "caption": "A young boy is holding a frisbee and standing in a grassy area, possibly in a park.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car", "dog", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 444304, "caption": "A man is sitting on a couch and watching a television, with his head resting on his hands. The television is showing a video of a man sitting on a couch, which could be a reflection or a mirror image. The man is possibly watching his own reflection, which might be a funny or self", "mscoco_hallucinated_words": [["couch", "couch"], ["couch", "couch"]], "mscoco_gt_words": ["person", "bed", "remote", "tv"], "hallucination_idxs": [6, 32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.5}}, {"image_id": 305000, "caption": "The image features a woman standing at a fruit stand, surrounded by various fruits and vegetables. She is holding a wooden cutting board, likely to help her prepare or sell the produce. The scene is set in a tropical environment, with greenery and a colorful umbrella overhead.", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["person", "banana", "apple"], "hallucination_idxs": [50], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "A group of men are enjoying a night out at a dinner party, with one man holding a beer and the other sitting at a table with a glass of wine. They are dressed in formal attire, adding to the elegance of the event.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["wine glass", "person", "dining table", "bottle", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 154846, "caption": "A couple is enjoying a slice of pizza on a white plate, surrounded by other pizza slices, at a dining table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "pizza", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 567254, "caption": "A young boy is sitting on a couch, holding a TV remote control, and watching a TV show.", "mscoco_hallucinated_words": [["couch", "couch"], ["remote", "remote"]], "mscoco_gt_words": ["person", "tv", "bottle", "vase"], "hallucination_idxs": [7, 12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 79261, "caption": "A man is sitting on a bench, holding a broom, and wearing a uniform while a sign is nearby reading \"No Diving.\" The man is likely a maintenance worker, and the sign is likely in place to ensure the safety of people who might be tempted to dive into the water.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "handbag", "backpack", "clock"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.25}}, {"image_id": 301402, "caption": "A man is sitting in a chair, surrounded by a dining table, and a laptop computer. He is wearing a hat and appears to be working on a laptop in the living room, surrounded by other people and objects.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "chair", "person", "bottle", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 415828, "caption": "A group of people is gathered on a street, possibly in front of a building or a parked car, as they wait for the rain to stop. The scene is described as a \"rainy day,\" and the people are holding umbrellas to protect themselves from the rain. There are a few cars park", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "car", "traffic light", "handbag", "backpack", "stop sign"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 543231, "caption": "The woman in the image is using a remote control to play a video game on her TV while sitting on a couch, surrounded by other people. She is holding a drink in her hand and appears to be engaged in the game.", "mscoco_hallucinated_words": [["tv", "tv"], ["couch", "couch"]], "mscoco_gt_words": ["person", "bowl", "bed", "book", "remote"], "hallucination_idxs": [17, 22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.4}}, {"image_id": 495357, "caption": "A man rides a motorcycle down a city street, accompanied by a group of people, possibly friends or family, while a small dog walks on a leash nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "dog", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 523175, "caption": "A spoon is scooping up a bowl of hearty, flavorful soup, filled with carrots and potatoes, as it sits on a plate. The soup is served in a white bowl, and a red spoon is used to scoop the delicious meal. This", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "dining table", "spoon", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 184945, "caption": "A large group of motorcycles is parked outside, with some of them being locked up to metal poles. The scene is taking place in a city, with a few cars and a building in the background.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["potted plant", "bicycle", "motorcycle"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 49942, "caption": "A young man is standing under an umbrella, with his arms up and looking at the camera. He is wearing a suit, tie, and a pink shirt. This image captures a moment of the man's life, possibly in a city setting, where he is using an umbrella", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 223019, "caption": "A passenger train travels through the city, carrying people to their destinations. The train has a blue and silver color scheme, and it is stopped at a platform with multiple passengers waiting to board.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "suitcase", "train", "car", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 42889, "caption": "A teddy bear sits on a red chair next to a computer with a keyboard, mouse, and headphones. There is also a speaker on the table, and the teddy bear is holding a cell phone. The scene is well-lit and shows the teddy bear as a small, cute companion", "mscoco_hallucinated_words": [["chair", "chair"], ["computer", "laptop"], ["mouse", "mouse"], ["table", "dining table"], ["cell phone", "cell phone"]], "mscoco_gt_words": ["teddy bear", "keyboard", "bear"], "hallucination_idxs": [7, 11, 16, 28, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5555555555555556, "Recall": 0.6666666666666666}}, {"image_id": 22112, "caption": "A small bowl with fresh green herbs sits on a coffee table, next to a vase filled with flowers. This combination of plants adds a pleasant and natural touch to the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "vase", "dining table", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 247587, "caption": "A man is walking on a white surfboard on a beach, with a beach umbrella in the background.", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["person", "surfboard", "car"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": "A yellow school bus is parked at the side of the road, waiting for passengers. It is an open-top bus with a bike rack on the side, indicating that it is designed for transporting students who ride their bicycles to school. The image shows the bus parked in front of a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "bus", "bicycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 545056, "caption": "A large field filled with numerous sheep grazes under the green grass, with a fence and trees in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cow", "car", "sheep", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 401411, "caption": "A chef is preparing a meal at a large kitchen table, surrounded by various food items and utensils. The chef is holding a spatula and appears to be preparing to cook or serve food to the people sitting at the table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "person", "dining table", "bowl", "cup", "carrot", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 2867, "caption": "A group of people, including a man and a woman, are gathered on a snowy slope, possibly preparing for a skiing or snowboarding adventure. They are standing in a line, with one man holding a ski pole and the woman holding a backpack. This scene suggests that they are getting ready", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 246963, "caption": "In the image, a group of motorcyclists are riding down a road, with a stop sign in the background. The motorcyclists are wearing leather jackets and helmets, and one of them is holding a stop sign. The scene suggests that the motorcyclists are particip", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "stop sign"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 498225, "caption": "A group of people, including a woman and two men, are standing in front of a bakery counter, admiring the selection of cakes and pastries. One man is holding a slice of cake, while the woman is pointing to a cake display. The men seem to be discussing their choices", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "handbag", "donut", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124601, "caption": "In the image, we see a kitchen with a white countertop and a microwave oven. A coffee cup and a laptop are placed on the countertop, and a dish is sitting on the kitchen table.", "mscoco_hallucinated_words": [["oven", "oven"]], "mscoco_gt_words": ["laptop", "sink", "bottle", "keyboard", "dining table", "cup", "wine glass", "microwave"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 581749, "caption": "A pile of fresh vegetables, including broccoli, carrots, and lettuce, is displayed in a plastic bag. The vegetables are fresh and well-packed, with some of them still wrapped in their original packaging. The image is taken at a grocery store, suggesting", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["broccoli", "orange", "dining table"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 227960, "caption": "In the image, there is a large bowl filled with brussels sprouts, a popular vegetable dish, and a spoon is present. The bowl is placed on a table, and it is likely that the brussels sprouts are being served as a side dish at a gathering", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bowl", "cup", "spoon", "wine glass", "carrot"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 286503, "caption": "In the image, we see a large elephant standing on a platform or a stage, with a large crowd gathered around it. The elephant is surrounded by people, and it is holding a small ball in its trunk. The scene appears to be at a zoo or an event, where the eleph", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 315740, "caption": "In this image, a kitchen is filled with various appliances, including a refrigerator, stove, and sink. There is also a dishwasher and a microwave oven. The kitchen is well-equipped and well-organized, with cabinets and drawers for", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["chair", "sink", "bowl", "tv", "potted plant", "oven", "microwave", "couch"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.375}}, {"image_id": 142108, "caption": "A group of people are gathered around a long table with several baked bananas on it. They are all busy preparing and cutting up the bananas, possibly for a meal or a snack.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "banana", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542933, "caption": "A baseball player is standing on the field, holding a bat, and waiting for the pitcher to throw the ball. The player is surrounded by a large crowd of people, who are cheering and watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "chair", "person", "bench", "baseball glove", "baseball bat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 475043, "caption": "A group of friends is sitting on a couch in a living room, enjoying a beverage while using their laptops and a tablet. One person is sipping from a cup of coffee, while others are engaging in online activities, such as browsing the internet or playing games on their devices.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["laptop", "person", "bottle", "bowl", "spoon", "couch"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 456784, "caption": "A man is holding a knife and slicing a white cake on a table.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "cake", "knife"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 33753, "caption": "A television remote sits on a bench, surrounded by greenery, as a person enjoys the outdoors on a sunny day.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["bench", "remote", "chair", "tv"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 448694, "caption": "A group of young people, including a boy and two girls, play a game of frisbee on a green grassy field. The boy tosses the frisbee while the girls catch it, demonstrating their teamwork and coordination. The scene shows the fun and enjoyment of playing outdoor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": "A bowl filled with a hearty and flavorful meal, featuring a mix of vegetables and meat, sits on a blue table. The dish is composed of broccoli, carrots, and chicken, all cooked together in a savory sauce. The bowl is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "bowl", "broccoli", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 503210, "caption": "A spacious living room with a brown leather couch, a coffee table, a grandfather clock, and various other furniture pieces. The room is well-lit and decorated with colorful cushions and curtains, creating a cozy and inviting atmosphere.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["chair", "clock", "vase", "couch", "potted plant", "book", "orange"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2857142857142857}}, {"image_id": 142257, "caption": "A busy street with cars and traffic lights is captured in the image.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}], "overall_metrics": {"CHAIRs": 0.258, "CHAIRi": 0.09568382735309412, "Recall": 0.5225512528473805, "num_hallucinated_caps": 129.0, "num_caps": 500.0, "hallucinated_word_count": 184.0, "coco_word_count": 1923.0, "length_response": 41.85, "hallucinated_caps_ls": [95908, 324008, 247179, 493862, 253630, 161227, 343534, 459141, 227031, 209347, 183766, 344942, 133146, 498747, 185327, 129707, 37907, 235595, 489909, 333712, 148977, 399058, 183571, 325836, 467887, 346716, 401010, 313928, 222782, 122602, 59710, 527497, 265628, 499594, 255483, 258209, 245664, 453731, 443299, 120776, 219546, 437720, 535403, 449798, 375769, 426172, 138078, 180764, 147762, 333998, 295105, 301837, 240681, 250540, 47940, 134768, 526414, 273132, 505213, 412407, 188136, 449675, 191691, 557447, 134223, 475813, 558784, 53431, 441840, 381031, 539555, 279521, 330050, 254161, 163518, 423984, 288729, 302789, 30667, 328110, 379443, 536154, 353320, 416384, 531327, 1268, 575406, 436814, 275611, 444913, 303099, 205193, 272566, 14940, 191301, 124236, 14285, 381615, 49005, 425569, 210372, 429598, 490711, 304984, 153607, 227438, 18150, 491000, 474499, 358086, 487990, 397268, 127659, 444304, 305000, 567254, 79261, 543231, 184945, 42889, 247587, 124601, 581749, 227960, 315740, 475043, 456784, 33753, 503210]}}}