{"overall_metrics": {"CHAIRs": 0.246, "CHAIRi": 0.08144578313253012, "Recall": 0.5712984054669704, "num_hallucinated_caps": 123.0, "num_caps": 500.0, "hallucinated_word_count": 169.0, "coco_word_count": 2075.0, "length_response": 41.856, "hallucinated_caps_ls": [144305, 324008, 247179, 39053, 269873, 253630, 317320, 161227, 195645, 343534, 370657, 460347, 254368, 459141, 277479, 409346, 300124, 185327, 482432, 379842, 203110, 556478, 506401, 278365, 368367, 21779, 333712, 148977, 467887, 401010, 388237, 24104, 527497, 61959, 473118, 265628, 499594, 258209, 285820, 245664, 443299, 354559, 545594, 219546, 535403, 375769, 426172, 138078, 180764, 147762, 47781, 14773, 563938, 47940, 134768, 526414, 273132, 412407, 188136, 191691, 561967, 280930, 3742, 217593, 477016, 539951, 564629, 53431, 381031, 9628, 330050, 423984, 30667, 328110, 366111, 291634, 70815, 88269, 463211, 536154, 560018, 353320, 416384, 531327, 51054, 1268, 542771, 436814, 478380, 110449, 45550, 303099, 205193, 140702, 124236, 150703, 381615, 226802, 210372, 429598, 333365, 145666, 304984, 352900, 227438, 18150, 491000, 39663, 474499, 105782, 138834, 111409, 127659, 444304, 223019, 42889, 401411, 581749, 315740, 475043, 99053, 503210, 142257]}, "results": {"sentences": [{"image_id": 144305, "caption": "A computer with a keyboard, mouse, and a laptop is sitting on a table, with a few cables connected to it. The computer is connected to a monitor, which is showing a blue screen. The image highlights the importance of computer technology in our daily lives, as it is essential for communication, information access", "mscoco_hallucinated_words": [["mouse", "mouse"], ["monitor", "tv"]], "mscoco_gt_words": ["dining table", "keyboard", "laptop"], "hallucination_idxs": [6, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 164091, "caption": "A small doll and a teddy bear are placed inside a baby carriage in a room. The doll and teddy bear are resting on a cushion, creating a cozy and comforting environment for them.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 308003, "caption": "A wooden bench is sitting in a grassy area, surrounded by trees. The bench has a green and white striped pattern on it, and it appears to be an outdoor seating area. The image captures the serene and peaceful atmosphere of the natural setting, inviting the viewer to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": "A plate with a sandwich, a salad, and a fork is sitting on a white tablecloth. The sandwich is cut in half, and the salad has a large serving of lettuce and tomatoes. The fork is placed on top of the salad.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 95908, "caption": "A white mouse sits on a mousepad next to a cup of hot coffee, while a computer is nearby. The cup is in a metal cup holder, and there is a laptop in front of the cup.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "cup", "mouse", "keyboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 329614, "caption": "A car is driving down a city street, passing a busy intersection with a double-decker bus and a large building in the background. The city street is lined with tall buildings, and the sky is overcast.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 324008, "caption": "A passenger on an airplane is enjoying a meal consisting of a sandwich, an orange, and a banana on a tray.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["dining table", "banana", "cup", "airplane", "orange", "person", "train"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5714285714285714}}, {"image_id": 52700, "caption": "A group of people are enjoying a cake buffet, with a variety of desserts and cakes on display. The event appears to be a celebration, as there are several cakes and desserts on the table, and a person is holding a fork and a spoon.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "fork", "spoon", "handbag", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 501311, "caption": "The image shows a baseball player pitching a baseball to a batter, with a ball flying through the air. The pitcher is wearing a baseball uniform and glove, while the batter is standing at the plate. The ball is in mid-air, ready to be caught by the batter. The scene is set", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 247179, "caption": "A man is standing next to a large elephant, with a crowd of people watching them. The elephant is decorated and dressed up, and the man is wearing a hat and holding a trumpet. The scene takes place at night, and there are street lights illuminating the area.", "mscoco_hallucinated_words": [["street light", "traffic light"]], "mscoco_gt_words": ["clock", "elephant", "truck", "person"], "hallucination_idxs": [48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 577912, "caption": "A beautiful bathroom with a large white bathtub, a white sink, and a toilet. The toilet is in a separate room. The room also includes a white countertop and a window.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "sink", "toilet", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 196341, "caption": "A woman is walking down a hallway, looking at a large clock on the wall. The clock is located inside the famous Clock Tower in Paris, France.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 234433, "caption": "A bicycle rider is seen approaching a traffic signal in a busy urban street. The signal is located at the corner of a street and a sidewalk, and it features a sign that reads \"LHT RD RI RD.\" This indicates that the rider is approaching a left turn, and the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "bicycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 455610, "caption": "A group of people are gathered around a motorcycle, admiring its unique design and colorful paint job.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "motorcycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": "A table is set with various dishes, including a bowl of eggs, a plate of pasta, a dish of fried food, and a bowl of yogurt. There are also utensils, such as a spoon and a fork, on the table. The scene is described as", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["dining table", "bowl", "cup", "apple", "cell phone", "spoon", "cake"], "hallucination_idxs": [42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.42857142857142855}}, {"image_id": 493862, "caption": "A young woman is standing on a grassy hill, holding a tennis racket and looking up at the sky. She is in the middle of a beautiful landscape, surrounded by trees and the sun in the background. The image captures a moment of leisure, with the woman enjoying her time outdoors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 269873, "caption": "A group of people is walking down the sidewalk, passing by a bus with a stop sign. The people are dressed in formal attire, which suggests that they are likely going to or from work. The presence of the bus indicates that the city has public transportation services available for residents, making it easier for them", "mscoco_hallucinated_words": [["stop sign", "stop sign"]], "mscoco_gt_words": ["traffic light", "bus", "person", "car"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 524656, "caption": "A well-equipped kitchen with a stainless steel sink, a refrigerator, a microwave, a toaster, and a dishwasher is the main focus of this image. The kitchen is neatly organized with a variety of utensils and appliances, such as", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "bowl", "wine glass", "bottle", "refrigerator", "cup", "microwave", "sink", "spoon", "oven", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.36363636363636365}}, {"image_id": 369547, "caption": "A black and white dog is sitting on a beach, surrounded by rocks and sand. The dog is looking at a bird in the distance, possibly trying to catch it. The dog's presence on the beach creates a beautiful and intriguing scene, capturing the attention of the viewer.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "cat", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 181446, "caption": "A man is standing in front of a refrigerator, holding a bottle of soda. He is wearing a black shirt and a baseball cap, giving the impression that he is a casual and laid-back person. The man is looking at the refrigerator with a curious expression,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "refrigerator", "sink", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 128119, "caption": "A person is standing on a city bus, looking down at their phone while the bus is parked at a curb. The bus has a bicycle hanging from the roof, and a handbag is on the floor.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bicycle", "cell phone", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 401027, "caption": "A sandwich is placed on a plate, with various ingredients such as lettuce, tomato, and cheese. A slice of bread is seen on top, along with a knife and a fork. The sandwich is set against a white tablecloth, and there is a glass of water on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "sandwich", "cup", "fork", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 253630, "caption": "A dark brown dining table is sitting in the middle of a living room. The table has a glass top and is surrounded by chairs and a couch. There is a brown leather chair in front of the table, and a red cushion is placed on top of a large couch. The room", "mscoco_hallucinated_words": [["couch", "couch"], ["couch", "couch"]], "mscoco_gt_words": ["dining table", "chair", "potted plant", "tv"], "hallucination_idxs": [28, 53], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.5}}, {"image_id": 326021, "caption": "A woman is sitting at a table with a teddy bear and a red tablecloth. She is holding a sign that reads, \"Just seeing bad eye results. I have to get my eyes checked!\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "teddy bear", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": "A man rides a bicycle on the sidewalk in front of a busy street, while a woman is walking past him. The street is lined with yellow lines and a parked car.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": "A man is seen riding a surfboard in the ocean, with the waves crashing against the shore in the background. He is wearing a wetsuit and appears to be enjoying his surfing experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "person", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 161227, "caption": "A leather couch is sitting in front of a television, and there is a laptop on the table next to it. A remote control is also present, with a TV screen showing a menu or channel selection. In the background, there are other furniture pieces, such as a chair and a table, along with", "mscoco_hallucinated_words": [["television", "tv"], ["table", "dining table"], ["tv", "tv"], ["table", "dining table"]], "mscoco_gt_words": ["remote", "laptop", "couch", "chair", "cell phone", "keyboard"], "hallucination_idxs": [9, 18, 32, 57], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 25812, "caption": "In the image, a man is snowboarding down a snow-covered hill, with a ski lift and a ski resort in the background. The man is wearing a ski jacket and holding his snowboard, indicating that he is an experienced snowboarder. This scene showcases the winter sport of snow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 267537, "caption": "A group of people is sitting in the stands, watching a baseball game. They are dressed in formal attire, including dresses and suits, and are holding umbrellas to protect themselves from the rain.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "bench", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 195645, "caption": "A group of people, including a man and a woman, are sitting at a wooden table, surrounded by chairs. They are enjoying a gathering, possibly a family dinner or a social event, as they are conversing and laughing together. The man is holding a glass of wine, and the woman is", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["dining table", "bench", "wine glass", "bottle", "handbag", "person"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.3333333333333333}}, {"image_id": 155671, "caption": "The image features a busy street with multiple cars and a traffic light in the middle of the intersection. The street is lined with buildings, including a restaurant, and there are pedestrians present as well.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 412894, "caption": "A group of people, possibly tourists, is walking down a city street, passing by a red traffic light at a busy intersection. The street is lined with shops and buildings, and the scene captures the hustle and bustle of city life.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "handbag", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 32625, "caption": "The image shows a table with a bowl of soup, a cup of coffee, and a fork on it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "cup", "fork", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 18688, "caption": "A baseball player in a red uniform is pitching a baseball to a batter in a white uniform, while a crowd of people watches from the stands.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 343534, "caption": "A young girl stands next to a stuffed dog, holding a teddy bear, and sitting on a chair in front of a table. The girl is dressed in a pink outfit, and her dog is sitting next to her. The scene is set in a room with a bookshelf, a chair,", "mscoco_hallucinated_words": [["girl", "person"], ["table", "dining table"], ["girl", "person"]], "mscoco_gt_words": ["dog", "potted plant", "chair", "book", "teddy bear"], "hallucination_idxs": [2, 24, 27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.375, "Recall": 0.6}}, {"image_id": 370657, "caption": "A group of people, including a man, a woman, and a young girl, are riding on motorcycles. They are wearing helmets and carrying baskets on their bikes, possibly indicating that they are on a trip or a tour. The scene takes place on a street, with a", "mscoco_hallucinated_words": [["bike", "bicycle"]], "mscoco_gt_words": ["motorcycle", "handbag", "person"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "A man sits in a stadium, holding a hot dog and eating it while watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "hot dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460347, "caption": "A large city street with multiple lanes is filled with cars, buses, and a person on a cell phone.", "mscoco_hallucinated_words": [["cell phone", "cell phone"]], "mscoco_gt_words": ["bus", "person", "car"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 398753, "caption": "The image shows a baseball field filled with people, including a baseball player wearing a glove, a baseball bat, and a baseball glove. There is also a large crowd of people watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 67833, "caption": "A group of people are enjoying a delicious meal together at a table, with a pizza and other food items in front of them. They are sharing a meal, having a good time, and enjoying the food.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "wine glass", "bottle", "cup", "fork", "pizza", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 272880, "caption": "A person is holding a pizza slice and a pizza box, with a fork in their hand, while eating a slice of pizza. The pizza box has the name \"Mystic Pizza\" written on it, indicating that it is a pizza shop or restaurant. The person is enjoying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "fork", "pizza", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 254368, "caption": "A man in a bathrobe is sitting on a bed, eating a piece of pizza while holding a bowl of soup.", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["pizza", "person", "bed"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 193108, "caption": "A baseball player is standing in front of a fence, wearing a baseball uniform, and holding a baseball bat. He is ready to hit a ball that is being tossed by another player in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 459141, "caption": "A woman rides a bicycle while wearing a hat and holding a large plastic bag full of groceries. She is navigating through a crowded city street, which is filled with various cars, trucks, and pedestrians. The image captures the woman's determination", "mscoco_hallucinated_words": [["car", "car"], ["truck", "truck"]], "mscoco_gt_words": ["potted plant", "motorcycle", "bicycle", "person"], "hallucination_idxs": [33, 35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 231534, "caption": "An airplane is being loaded with luggage and other items, as a man carries a suitcase and a handbag, while a truck is parked nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "airplane", "person", "handbag", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 227031, "caption": "A man and woman are standing next to a cake at a wedding reception. The man is holding a knife, and the woman is holding a small bouquet of flowers. They are both smiling and looking at the camera. The cake is on a table, and there are other people in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "tie", "knife", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 209347, "caption": "A woman is sitting on a subway train, using her cell phone while holding onto a handrail for support.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "cell phone", "handbag", "person", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 523292, "caption": "A cat is sitting on a laptop, which is open on a table. The cat is looking at the screen and appears to be watching the laptop display.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "chair", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 12375, "caption": "The image features a white plate filled with a delicious meal, consisting of various food items such as chicken, potatoes, carrots, and lettuce. The meal is served with a side of broccoli, which adds a healthy and tasty element to the dish.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "broccoli", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 13550, "caption": "A woman is sitting on a rock next to an elephant, petting it while holding a handbag.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 146837, "caption": "The young man is skateboarding in a parking lot, showcasing his skills and enthusiasm for the sport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "motorcycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 67042, "caption": "A man stands next to a large stone archway, looking at his cell phone while wearing a suit.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 209925, "caption": "A baseball player is shown in mid-action, with his arm extended and the ball in his hand, ready to pitch.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 2154, "caption": "A man sits on a bench, surrounded by trash and an empty shopping cart, in the middle of a city street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "bench", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 274931, "caption": "A city street is shown in the image, with cars parked along the side of the road. A car is parked in front of a building, and a red traffic light is visible in the background. The street is empty, giving the scene a deserted atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "fire hydrant", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 104326, "caption": "The image features a cozy dining room with a table, chairs, and a clock. There are several dishes on the table, and a kitchen area is visible behind the table. A green dining room table and matching chairs contribute to the warm and inviting atmosphere. The room is well-lit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "potted plant", "microwave", "clock", "chair", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 233888, "caption": "A young boy is playing baseball with a bat in front of a television, surrounded by a living room setting. He is wearing a baseball uniform and is attempting to hit a baseball that is being thrown by a person. The television is playing a baseball game, and the boy is likely watching the game while trying to practice", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "potted plant", "baseball glove", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 213905, "caption": "Two women tennis players are standing on a grassy field, holding tennis rackets and smiling at each other. One woman is wearing a white tennis dress, while the other is wearing a black tennis dress. They appear to be enjoying their time on the field, possibly during a break or before a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "backpack", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 277479, "caption": "A young girl is walking towards the refrigerator in the kitchen, possibly looking for a drink or snack. She is holding a bottle of ketchup in her hand and has a toy dog with her, which she might be using as a toy. The girl is walking in front of a", "mscoco_hallucinated_words": [["dog", "dog"]], "mscoco_gt_words": ["refrigerator", "person", "bottle"], "hallucination_idxs": [34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 300784, "caption": "A group of children, including a boy and a girl, sit together on a couch, surrounded by a dog and a wooden bench. They appear to be enjoying their time together, and the presence of a dog adds a playful and fun atmosphere to the scene.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 183766, "caption": "A delicious slice of cake, decorated with fresh berries and a slice of cheesecake, is presented on a white plate. The arrangement is perfect for a special occasion or as a treat to indulge in.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "fork", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 169169, "caption": "A person is standing in front of a large, green-colored street sign in the middle of a city street. The sign is displaying the word \"Spring\" in a modern font, and it appears to be a prominent and well-lit street sign. The city street is surrounded by various buildings and people walking around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "potted plant", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 409346, "caption": "A group of people, including a woman and a man, are enjoying a meal at a table. The woman is holding a spoon while the man is holding a fork. There is a bowl of fruit in front of them, and a variety of foods, such as a cake, are on", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["dining table", "bowl", "spoon", "person", "cake"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1, "Recall": 1.0}}, {"image_id": 522262, "caption": "A long line of bicycles is parked along the sidewalk in front of a building.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "bicycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "A man is holding a yellow, plastic ball while standing in front of a fence, making a funny pose.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "orange", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 344942, "caption": "A small wooden toy is perched on top of a computer monitor, peeking out from behind the laptop screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 275929, "caption": "Two toilets are sitting on the stairs in a building, with one of them being a white porcelain toilet, and the other being a brown porcelain toilet. The image is taken from the top, providing a view of the toilets from above.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toilet", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": "A man is walking in a park, holding an umbrella, and looking at a woman who is sitting on a bench.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "bench", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 300124, "caption": "A small, old, and worn-out couch is sitting in the middle of a dirt street, surrounded by trees and greenery. The couch has a tray on top of it, which might be used for food or a cup of coffee. The scene suggests a sense of nostalgia, as", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["couch", "dining table", "chair", "microwave"], "hallucination_idxs": [42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 46919, "caption": "A man is walking uphill with skis on his feet, heading towards a snowy mountain peak.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 434022, "caption": "A white train engine is traveling down a rail track, with a black engine in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 490491, "caption": "A man is standing in front of a street sign and a brick wall, looking at the camera. The street sign has a red arrow pointing to the left, indicating that the street is one-way. The brick wall is partially covered with graffiti. The scene suggests that the man is taking a moment to observe", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 175878, "caption": "A group of friends are gathered around a large outdoor trash can, engaged in a conversation. One person is holding a cell phone, while the others are either using their phones or not. The scene suggests that they might be discussing something interesting or sharing a funny moment. The presence of a trash", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 12669, "caption": "In this image, a young woman is standing in a room surrounded by people, holding a wine glass. She is posing for a photo with a group of friends, while a man is also present in the background. The woman is wearing a white shirt, and the group appears to be enjoying a social", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "handbag", "person", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 192496, "caption": "A train is seen moving down the tracks, passing a small station in the countryside. A person is standing on the platform, looking at the train as it goes by. There is also a train car with a blue and white paint job, which might be a passenger train or a freight train. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 133146, "caption": "The living room features a couch, a chair, a book, and a vase. It has a fireplace and a TV, making it a cozy space for relaxation and entertainment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "vase", "couch", "chair", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 53744, "caption": "A caption for this image could be: \"A fresh and colorful salad on a cutting board, complete with a knife and a sandwich plate, is ready to be enjoyed as a healthy and delicious meal.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375902, "caption": "A man in a blue and white ski suit, wearing a backpack, is skiing down a snowy mountain slope while holding a pair of skis.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 498747, "caption": "In this image, a young man is holding a cell phone while standing in a room full of people. He is likely making a call or texting, and the group of people around him is engaged in conversation. The image captures a moment of social interaction and communication, where people are interacting with each other and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "cell phone", "person", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 52435, "caption": "A group of people are enjoying a day at the beach, with a surfboard, an umbrella, and a large body of water.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "surfboard", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 301977, "caption": "A cow stands by a row of colorful bottles and soda cans, possibly waiting to be milked. The scene is set against the backdrop of a bustling street, indicating that it might be a busy and active area.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "bottle", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 261097, "caption": "A man wearing a tennis uniform is walking on a tennis court, looking at his racket, and holding it in his hand. He is standing near a blue tennis court and is likely preparing for a match or taking a break.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227204, "caption": "A group of three women are sitting at a dining table, enjoying their meal. One woman is eating a banana, while the other two women are eating their food. They all appear to be in their 50s or older, and they are dressed in casual clothing. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "banana", "bottle", "cup", "cell phone", "spoon", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 353981, "caption": "A large airplane sits on the tarmac, surrounded by smaller vehicles and equipment, possibly waiting to be serviced or prepared for takeoff.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 185327, "caption": "A man is walking down a street, holding a long stick, and surrounded by a group of elephants, which are being led by a man on a motorcycle. The scene is taking place on a busy road with cars and other vehicles passing by. The presence of the elephants adds a unique and interesting", "mscoco_hallucinated_words": [["elephant", "elephant"], ["motorcycle", "motorcycle"], ["elephant", "elephant"]], "mscoco_gt_words": ["bus", "car", "horse", "person", "cow"], "hallucination_idxs": [19, 30, 53], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.4}}, {"image_id": 348654, "caption": "A small, black iPhone sits on a desk next to a white laptop, while a white iPhone is placed on top of a black iPhone stand. A black laptop is also visible on the desk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cell phone", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 482432, "caption": "A toothbrush, toothpaste, and a bottle of whitening toothpaste are arranged on a bathroom sink, along with a toothbrush cup and a toothbrush holder.", "mscoco_hallucinated_words": [["bottle", "bottle"], ["cup", "cup"]], "mscoco_gt_words": ["sink", "bowl", "toothbrush"], "hallucination_idxs": [7, 22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 454161, "caption": "A pizza and a glass of wine are on a dining table, accompanied by a fork.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "pizza", "fork", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 144723, "caption": "A dog is flying through the air while holding a frisbee, showcasing its impressive flying skills and love for the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "dog", "car", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "A person is holding a cell phone with a large screen, showing a digital interface. The phone is being used to make a call.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 379842, "caption": "A small, white Nintendo Wii console and a controller are sitting on top of a stack of books, with a Game Boy Advance Game and a Game Boy Advance Game Book next to them.", "mscoco_hallucinated_words": [["boy", "person"], ["boy", "person"]], "mscoco_gt_words": ["dining table", "remote", "book"], "hallucination_idxs": [23, 29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 203110, "caption": "A man is riding a vintage, bright orange, open-door trolley car down a city street, possibly in a busy downtown area. The trolley car has an old-fashioned design, with wooden benches and a steering wheel. The man is enjoying the", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["bus", "car", "orange", "truck", "person", "train"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.6666666666666666}}, {"image_id": 556478, "caption": "A close-up image shows a slice of pizza on a plate, with a fork and knife placed next to it.", "mscoco_hallucinated_words": [["fork", "fork"], ["knife", "knife"]], "mscoco_gt_words": ["pizza", "oven", "cup", "bottle"], "hallucination_idxs": [14, 16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.25}}, {"image_id": 103815, "caption": "A baseball player throws a baseball while another player watches from the dugout.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 451943, "caption": "A bed is seen in the image, with two pillows on it. There is a lamp nearby, casting light on the bed. The bed is situated in a room with a wooden floor and a white wall.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "suitcase", "backpack", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 268854, "caption": "A woman carrying a large wooden boat on her shoulder is walking towards a beach, surrounded by boats and people.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 34464, "caption": "A group of people, including a young girl and a man, are having fun in the ocean while holding onto a red inflatable kayak. They are enjoying their time on the water, paddling and playing with the kayak in the waves.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 495513, "caption": "A man and a woman are holding hot dogs on forks while standing in front of a fire.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "person", "hot dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 529256, "caption": "A dog is laying on a red bed, and a dog is laying on the floor near the bed. The dog on the bed is looking at the camera, while the other dog is looking at the camera from a distance.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["book", "dog", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "A cat sits on a TV stand, looking at the TV screen with a curious expression.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 506401, "caption": "A city street is bustling with cars, a truck, and a few people walking, while a white dog and a statue of a wolf sit in the middle of the road.", "mscoco_hallucinated_words": [["dog", "dog"]], "mscoco_gt_words": ["traffic light", "car", "cat", "truck", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 406611, "caption": "A group of people is gathered at the bottom of a ski slope, watching a skiier on the slopes. The skiier is about to hit a jump, and the group of people is cheering. The scene is set in the snowy mountains, creating a festive atmosphere for winter sports enthusiasts", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "In the image, there is a television truck parked on the street, along with several cars and a group of people. The truck is equipped with antennas, which are used for broadcasting or transmitting signals. The presence of the television truck and the people around it suggests that there is a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "tv", "car", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 278365, "caption": "Two friends are enjoying a meal together on a patio, with a pizza box on a table. One person is eating a slice of pizza, while the other is holding a pizza box. They are both sitting on a bench, with a chair nearby.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["dining table", "cup", "pizza", "chair", "cell phone", "person"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 69757, "caption": "A group of people, including an older man, a woman, and a young girl, sit around a dining table, enjoying a delicious cake on a special occasion. The cake is decorated with candles and colorful candies, adding to the festive atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "cup", "chair", "knife", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 432213, "caption": "In the image, a person is holding a sandwich with a slice of fried chicken, lettuce, and tomato, all topped with a sauce. The person is sitting at a table, enjoying their meal. The image captures a moment of relaxation and satisfaction as the person sav", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "sandwich", "wine glass", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 368367, "caption": "A young woman is sitting at a table outside, enjoying a meal while talking on her cell phone. She is dressed in a white shirt and black pants, and has a casual, relaxed demeanor.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "A busy road with a traffic light and a construction site, featuring a truck and a car, is the scene in the image. The construction site has a sign that reads \"Grand National Boulevard,\" indicating the name of the street or road. The presence of a traffic light suggests that the intersection is being", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 92131, "caption": "A group of people, including a man and a woman, stand near a bus, which is parked on a street. They appear to be waiting for the bus to start moving or are simply observing it. The bus has a sign on it that reads \"Bus Stop,\" indicating its purpose.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": "A young woman is sitting on the floor and holding a suitcase, which is open and filled with her belongings. She is smiling and possibly looking at her phone or a map, suggesting that she might be planning a trip or preparing for a journey.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "suitcase", "backpack"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 565148, "caption": "A baseball player is at the plate, ready to hit a home run in front of a crowd of people. He is wearing a baseball cap, a baseball glove, and a baseball bat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 160183, "caption": "A fire truck is parked outside a large building with a fire hose extended from the back. There are people in the background, and a group of firefighters can be seen standing near the truck. The fire truck is likely used for training purposes or for a demonstration, and it is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 555456, "caption": "The image shows a group of skiers and snowboarders lined up at the base of a snow-covered hill, preparing to hit the slopes. The scene is captured from a bird's-eye perspective, showcasing the snowy landscape and the winter sports enthusiasts getting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 235595, "caption": "A group of motorcycles, including a Harley-Davidson, is parked in a row on the sidewalk outside a restaurant. The scene is set in a busy city, where people are walking and cars are passing by. The presence of the motorcycles indicates a vibrant and bustling", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cup", "potted plant", "car", "parking meter", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 489909, "caption": "A basket of colorful fruits and vegetables is arranged in a bowl. The bowl is filled with various fruits, such as bananas and oranges, as well as some vegetables, like green cucumbers. The fruit and vegetables are displayed in a pleasing arrangement, making for", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "orange", "banana"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 501080, "caption": "A large red poinsettia flower is placed in a clear glass vase, standing on a wooden table. The poinsettia is surrounded by a decorative bowl and a small white flower, creating a beautiful and festive arrangement.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "vase", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 405183, "caption": "A young girl is sitting on a couch, holding a small remote control while a group of friends are gathered around her. They are watching a video game on a TV screen, and the girl is trying to demonstrate her skills in the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "tv", "potted plant", "couch", "chair", "book", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 409138, "caption": "A green city bus is parked on the side of a street, near a curb.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 411840, "caption": "A couple of tennis players walk on the grassy field, carrying their tennis rackets and balls. They are wearing sports attire and are ready to play a game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "tennis racket", "chair", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 333712, "caption": "The image shows a slice of pizza on a plate, with a green topping and cheese. A knife and a spoon are placed next to the pizza, indicating that it's ready to be eaten. The slice is a delicious treat that can be enjoyed by pizza lovers.", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["dining table", "pizza", "spoon"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 148977, "caption": "A small teddy bear sits on a table, wearing headphones, and listening to music while holding a book. It is placed next to a cup of coffee and a bottle of cola. The scene shows the teddy bear enjoying its music and reading, creating a cozy atmosphere.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["dining table", "bear", "bottle", "teddy bear", "book", "keyboard"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 399058, "caption": "A man is riding on the back of a large elephant as it travels down the road. The man is wearing a white shirt and a pair of sunglasses, while the elephant is covered in a layer of mud. The scene is captured on a rural road, surrounded by", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bicycle", "orange", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 183571, "caption": "A man is standing on a boat, holding a small dog. The boat is on a body of water, and the man is smiling while petting the dog.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 325836, "caption": "A vintage motorcycle is on display at a red carpet event, showcasing its sleek design and colorful paint job. The motorcycle's unique style, with its bright red and black paint scheme, stands out against the black and white background, making it a focal point in the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 437910, "caption": "In a small, cramped bathroom, a toilet is situated next to a sink. The bathroom has a white wall, and there is a large stack of newspapers on the floor.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toilet", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 155885, "caption": "A group of birds are flying overhead a small boat, with a lone man sitting on the boat, enjoying the view.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 467887, "caption": "A man in a red shirt is sitting in a living room, using a laptop on a table. He is likely engaged in some work or activity, possibly using a computer program or browsing the internet. The man is wearing glasses and has a cup of coffee on the table next to his laptop.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["dining table", "laptop", "mouse", "couch", "chair", "person"], "hallucination_idxs": [48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.5}}, {"image_id": 174402, "caption": "The image shows a young man holding a tennis racket and standing on a tennis court. He is wearing a blue shirt and tennis shoes, and has a tennis ball in his hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 352734, "caption": "A young boy is eating a birthday cake from a plate with a spoon.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "fork", "spoon", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 346716, "caption": "A group of red double-decker buses are driving down a city street, passing in front of a red car.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451144, "caption": "Two men are standing on a snowy slope, with one of them holding a backpack. They are likely skiing or snowboarding, enjoying the beautiful winter landscape and the outdoor activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295656, "caption": "A group of people, including a man and woman, are enjoying a meal together at a restaurant. The woman is eating a pizza, and the man is eating a pasta dish. They are both smiling and having a good time.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "tie", "car", "clock", "pizza", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 129886, "caption": "A man and a woman are skiing down a snowy hill while wearing skiing gear, with a ski lift in the background. The image captures the fun and excitement of winter sports, with the skiers enjoying their time on the slopes and the ski lift providing a convenient means of transport", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557998, "caption": "A young girl is sitting at a dining table, surrounded by a beautiful garden and lush greenery, sipping a glass of wine. She is smiling and seems to be enjoying her time outdoors.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "bottle", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 401010, "caption": "A bed or bedding area is visible in the image, with a table nearby. The bed is covered with white linens, and there is a chair and a lamp in the room.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["chair", "sink", "tv", "bed"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 567562, "caption": "A group of young girls is sitting around a table, enjoying a meal together. They are sharing a variety of foods, including pizza, salad, and a glass of juice. The girls are smiling and engaged in conversation while eating, creating a warm and friendly atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "bottle", "cup", "fork", "pizza", "chair", "broccoli", "spoon", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2727272727272727}}, {"image_id": 313928, "caption": "A caption for this image could be: \"Sunny day at the beach with a yellow surfboard, a table and chairs, and a bottle of wine, providing a relaxing spot to enjoy a meal.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "surfboard", "wine glass", "bottle", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 490284, "caption": "A black dog is laying on a couch, resting its head on someone's hand, possibly seeking comfort or attention.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 346940, "caption": "A kitchen scene with a stove, a frying pan, and a pot on the stove is filled with smoke from the cooking process.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "oven", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "A woman walks down the sidewalk past an old-fashioned gas station sign, which reads \"AMOCO GAS.\" The woman is walking while looking at her phone, possibly using a map app or talking on the phone. The presence of the woman and her phone in the image creates a sense of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 255934, "caption": "An adult elephant and two young elephants are walking together in a zoo, with the adult elephant leading the way. The young elephants are close to the adult, and one is even holding onto the adult's trunk. The scene takes place in a rocky area with rocks and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "handbag", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 278627, "caption": "A group of friends are enjoying their meal at a restaurant, with a plate of fried chicken, a bottle of drink, and a delicious salad. The image captures the fun and relaxed atmosphere of the dining experience, showcasing the variety of food options available.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "cup", "potted plant", "fork", "chair", "spoon", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 400851, "caption": "A group of people lounging on a sandy beach, enjoying a beautiful day with plenty of sunshine and the presence of a tent, chairs, and umbrellas, creating a comfortable and relaxing atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "bench", "boat", "sports ball", "chair", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 472610, "caption": "A woman is standing with her dog in a field of cows, with a barn in the background. She is smiling and petting the dog, while the dog is wagging its tail. The woman and her dog appear to be enjoying a leisurely walk on a beautiful day.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 78565, "caption": "A group of people, including a man and a dog, are seen enjoying a day on the water, sailing and playing in the water.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": "A group of young people is gathered in a parking lot, enjoying the summer evening by skateboarding and hanging out. They are surrounded by a few cars, with one skateboarder in the foreground and another person on a skateboard in the background. The scene is filled with laugh", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["chair", "skateboard", "person", "bottle"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 289640, "caption": "A group of friends are gathered around a table with a large orange plastic cup, a dining chair, and a person wearing a yellow t-shirt. They are enjoying a fun night together, possibly celebrating a special occasion or just spending time together. The person in the yellow t-sh", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "cup", "chair", "orange", "frisbee", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7142857142857143}}, {"image_id": 122602, "caption": "A caption for the image could be: A helpful language and vision assistant sits at a desk with a paper, scissors, and a bottle of white glue, assisting the user with various tasks using natural language.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "scissors", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 24104, "caption": "A person is sitting at a desk in front of a computer, surrounded by various office supplies and a laptop. There is a cup of coffee on the desk, and a keyboard and mouse are also nearby. The person is using the computer to access information on a screen, and there is a television on the wall", "mscoco_hallucinated_words": [["person", "person"], ["person", "person"]], "mscoco_gt_words": ["dining table", "laptop", "tv", "cup", "mouse", "book", "keyboard", "bed"], "hallucination_idxs": [1, 42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.18181818181818182, "Recall": 0.75}}, {"image_id": 183709, "caption": "A group of people is standing on a city street, looking at a red light at a traffic intersection. They are waiting for the light to turn green before crossing the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "handbag", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 59710, "caption": "A white refrigerator is sitting on a wooden floor in a room, with its doors open and the interior exposed. The refrigerator is surrounded by other kitchen appliances and a window, creating a well-lit and organized space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "chair", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": "A young boy in a green baseball jersey and a baseball cap is standing on a field, ready to play baseball. He is holding a baseball and looking up at the sky with a smile on his face. The scene is set against a backdrop of trees, and there are other people watching the game in the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "bottle", "sports ball", "baseball glove", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 314729, "caption": "The image features an old black and white photograph of a man in a baseball uniform, standing in front of a white backdrop. He is holding a baseball bat and wearing a cap, ready to swing the bat and hit a home run. The image captures the spirit of competition and dedication of a baseball player", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 527497, "caption": "A person is sitting at a computer desk with a computer monitor and a keyboard in front of them. There is a phone on the desk, and a computer monitor with a digital clock on it. The person is likely working or engaging in some activity on their computer.", "mscoco_hallucinated_words": [["person", "person"], ["phone", "cell phone"], ["clock", "clock"], ["person", "person"]], "mscoco_gt_words": ["dining table", "laptop", "tv", "mouse", "keyboard"], "hallucination_idxs": [1, 23, 35, 40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3076923076923077, "Recall": 0.8}}, {"image_id": 411564, "caption": "A man is sitting on the edge of a chair, looking at his phone while sitting in the kitchen. The chair is placed near a window, allowing natural light to enter the room. The image captures a moment of relaxation and focus on the man's phone, with the presence of a dining table and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "refrigerator", "chair", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 320350, "caption": "A couple is walking on a frozen lake with their dogs, enjoying the winter scenery.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 401857, "caption": "A baseball player is swinging at a pitch on a baseball field. The player is wearing a baseball cap, and the ball is flying through the air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "cup", "sports ball", "baseball glove", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 285302, "caption": "A young boy is sitting at a dining table, surrounded by various crafting materials, including scissors, glue, and paper. He is engaged in a creative activity, possibly making a paper craft or art project.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "chair", "scissors"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 61959, "caption": "A white and red bus is driving down a street, with a red car in front of it. The bus is passing by a stop sign at the corner of the street, and there is a traffic light ahead. The image shows a typical urban scene with a bus and a car navigating through the busy city street.", "mscoco_hallucinated_words": [["stop sign", "stop sign"]], "mscoco_gt_words": ["traffic light", "bus", "truck", "car"], "hallucination_idxs": [26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 229659, "caption": "A man is sitting at a table in a coffee shop, using his laptop and typing on it. The laptop screen displays a blue and white website, with a caption that reads \"Helping hands.\" A few people are sitting nearby, enjoying their coffee or talking to each other. The scene captures the modern", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "bottle", "clock", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 473118, "caption": "A young man is skateboarding on a concrete ramp, performing a trick in the air while his skateboard is on a truck.", "mscoco_hallucinated_words": [["truck", "truck"]], "mscoco_gt_words": ["bicycle", "skateboard", "person"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "A man and a woman are walking on a snow-covered trail, possibly in a park or nature reserve, while they hold onto ski poles. The man is wearing a backpack, and the woman is wearing a purple jacket. They are likely on a snowshoeing or hik", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 416104, "caption": "A group of friends is enjoying a relaxing evening at a restaurant, with a few of them sitting at a table and others standing outside. They are sipping drinks and chatting with each other, creating a lively atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "dining table", "wine glass", "bottle", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 511852, "caption": "Two men are skiing down a snowy slope, with one man wearing a red jacket and the other man wearing a blue jacket. They are holding ski poles and appear to be enjoying the winter sports experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 59386, "caption": "A group of giraffes, including one with a leaf in its mouth, are gathered together near a tree in a field. The giraffes are standing in a line, with their heads close together, and one giraffe has its mouth open to grab a leaf from the tree. This scene is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "car", "giraffe"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "A green traffic light sits on a pole in the middle of a street, indicating that it's time for cars to stop and wait for the signal to proceed. The image captures the moment when the sun is setting, casting a warm glow over the scene. A few cars can be seen in the distance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 153692, "caption": "A man rides a bicycle across a street intersection, passing by a dog and a car. The man is dressed in casual attire and wears a backpack, while the dog is riding on the back of the bicycle. The image captures the moment of the man and the dog", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "dog", "bicycle", "car", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 265628, "caption": "A man is sitting on a toilet in a bathroom, with a toilet paper roll next to him. He is wearing shoes and appears to be waiting for something, possibly using his phone or simply enjoying a moment of privacy in the bathroom.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bowl", "toilet", "person"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 499594, "caption": "A plate filled with delicious pasta, broccoli, and a side of steak is sitting on a dining table, ready to be enjoyed by the person eating.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "cup", "bottle", "fork", "broccoli", "knife"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 5934, "caption": "A baseball glove sits on top of a baseball, with a ball in the glove. The image is set against a concrete wall, and the baseball glove and ball are placed on top of a rack, possibly in a sports store or museum. The baseball glove is leather-based and appears", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "bench", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47828, "caption": "The image features a blue city skyline with a boat and a bridge at night, giving it a unique and stunning view. The bridge is illuminated, and the boat is either docked or sailing through the water. This captivating scene offers an insight into the city's vibrant night", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47916, "caption": "Two dogs, a golden retriever and a yellow dog, are running through a grassy field while playing with a frisbee.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "car", "frisbee", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 255483, "caption": "A man is sitting at a desk with a stack of papers, possibly working on a project. He is holding a pen and appears to be reading through the documents. The image suggests that he is engaged in a task that requires careful attention and thoughtful consideration.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "scissors", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 131138, "caption": "A caption for the image could be: \"A modern workspace with a desk, computer, and a TV. The space is well-organized and has a variety of items such as a keyboard, a mouse, a coffee cup, and a plant. The person sitting at the desk is likely working", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "cup", "potted plant", "mouse", "spoon", "keyboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7777777777777778}}, {"image_id": 258209, "caption": "A man is sitting on a bench in front of a building, looking down at his phone. There is a bike rack next to him, and the man is wearing a suit and a hat.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bicycle", "bench", "person", "book"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.75}}, {"image_id": 347453, "caption": "A busy city street is filled with multiple red double-decker buses, cars, and pedestrians. The scene is captured from the side of a building, giving a bird's-eye view of the urban environment. The presence of both public and private vehicles on the street indicates a vibr", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "bus", "bench", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 285820, "caption": "A living room with a television, a couch, and a dining table is filled with various items such as a TV remote, a purse, a book, and a phone. The room has a wooden floor and is well-lit, creating a cozy atmosphere.", "mscoco_hallucinated_words": [["remote", "remote"], ["purse", "handbag"]], "mscoco_gt_words": ["dining table", "bowl", "bench", "tv", "couch", "cell phone", "book"], "hallucination_idxs": [23, 26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.7142857142857143}}, {"image_id": 245664, "caption": "A man is sitting at a desk with a laptop and a cell phone. He is working on his computer and reading a book while a TV is on in the background. There is a cup of wine on the table, and a keyboard and mouse are nearby. This scene portrays a relaxed and productive", "mscoco_hallucinated_words": [["man", "person"], ["cell phone", "cell phone"]], "mscoco_gt_words": ["dining table", "laptop", "wine glass", "cup", "tv", "mouse", "book", "keyboard"], "hallucination_idxs": [1, 12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.18181818181818182, "Recall": 0.875}}, {"image_id": 453731, "caption": "A small dog is lying on a wooden floor, surrounded by various items like a bottle, a bucket, and a wooden barrel. The dog is likely taking a nap or resting, enjoying its cozy and comfortable surroundings.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "cup", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 524601, "caption": "A group of friends are gathered in a living room, playing video games on a Nintendo Wii console. They are all excited and engaged in the game, with one person playing the Wii controller and others watching and cheering them on.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "refrigerator", "couch", "chair", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 253262, "caption": "A man stands next to a large airplane, holding a suitcase and looking at a smaller plane in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "tie", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 87052, "caption": "A couple is standing in a kitchen, holding hands and looking at each other while they are preparing food. They are surrounded by various kitchen utensils and appliances, including a stove and a refrigerator. The man is holding a jar of sauce, and the woman is holding a sp", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "cup", "refrigerator", "bottle", "vase", "oven", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 357578, "caption": "A red fire truck is parked on the side of a city street, next to a traffic light. The truck is manned by a firefighter who is standing next to it. A car is stopped in front of the fire truck, and a traffic light is in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 418692, "caption": "A man is sitting on a couch in a living room, reading a book while his girlfriend is lying on a couch nearby. The living room has a large window, and there is a chair nearby as well. The man and his girlfriend are enjoying their relaxation time together, engaging in activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "couch", "chair", "cell phone", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 259345, "caption": "A man with a long beard and wearing a colorful, patterned outfit is standing outside with a pink umbrella, smiling at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 119709, "caption": "A woman is sitting at a kitchen table, surrounded by a variety of doughnuts, and she is using a rolling pin to shape and prepare them.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "chair", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 443299, "caption": "A couple is sitting on a bench in a train station, both using their cell phones to browse through content on the screen. They are likely waiting for a train or checking the schedule. The man is wearing a jacket, and the woman is wearing a hat.", "mscoco_hallucinated_words": [["train", "train"], ["train", "train"]], "mscoco_gt_words": ["bench", "cell phone", "backpack", "handbag", "person"], "hallucination_idxs": [9, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6}}, {"image_id": 120776, "caption": "A group of people is gathered around a large metal sculpture, enjoying the outdoor space and the city view. The sculpture features a large, intricate design, likely made of metal, and is placed on a raised platform or a rooftop, offering a great vantage point for the people to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411765, "caption": "A man is playing tennis on a tennis court, swinging his tennis racket to hit the ball. The image captures a moment in time as the man prepares to hit the ball, focusing on the ball in front of him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 447991, "caption": "In the image, a woman is walking down the sidewalk in a city street, with a man walking on the other side. The woman is carrying a purse and wearing a blue shirt, while the man is wearing a white shirt and has his hands in his pockets. There are cars,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "bicycle", "car", "cell phone", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 276719, "caption": "A group of people and cars are gathered in a parking lot, with a dog walking around and a person holding a dog leash. The cars include both old and new trucks, as well as a convertible. The scene is lively and vibrant, with people socializing and enjoying the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "car", "chair", "handbag", "motorcycle", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 422328, "caption": "A horse is standing in the snow with its head hanging low, possibly due to the cold weather. It is pulling a wagon, which is filled with a large wooden crate. A man is walking nearby, likely supervising the horse or assisting with the wagon. The image captures a moment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "car", "skis", "horse", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 354559, "caption": "A young woman wearing a black and white striped dress holds a stuffed teddy bear, smiling while posing for the camera. The woman is holding the teddy bear in one hand and her phone in the other, which suggests that she might be taking a selfie or sharing a photo with her friends", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bear", "teddy bear", "person"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 438788, "caption": "A group of people is sitting at a table, enjoying a cake that is cut into slices.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 468005, "caption": "A large, brown elephant is walking along a boardwalk, with a large, wooden elephant statue behind it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 545594, "caption": "A man is standing in the middle of a city bus, looking at a cell phone. He is wearing a colorful shirt, and a backpack is visible on his back. The image captures the busy atmosphere of a city street, where people are walking and cars are passing by.", "mscoco_hallucinated_words": [["cell phone", "cell phone"], ["car", "car"]], "mscoco_gt_words": ["chair", "orange", "person", "backpack"], "hallucination_idxs": [15, 50], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 219546, "caption": "A large dining table is filled with various food items, including a ham, salads, and cheeses. The table is decorated with a Christmas tablecloth, creating a festive atmosphere. The image shows a group of people gathered around the table, enjoying their meal together.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "bowl", "bottle", "fork", "chair", "spoon", "knife"], "hallucination_idxs": [40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.14285714285714285}}, {"image_id": 386645, "caption": "A bustling street scene in an Asian city, with a large building with an old-fashioned facade, a car parked next to it, and a motorcycle parked in front of a restaurant.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 155131, "caption": "A woman in a tennis uniform is playing tennis, with her racket in hand and her back turned to the camera. She is on a grassy court, and there is a man in the background who appears to be watching her. The woman is about to hit the tennis ball with her racket.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "sports ball", "tie", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 188752, "caption": "A man is standing in a fruit market, surrounded by various types of fruits, including bananas, apples, and other items.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "person", "banana"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 228350, "caption": "In the image, a man is standing in front of a dining table, possibly waiting for a meal or greeting guests. The dining table is set with a white tablecloth, silverware, and wine glasses. There are chairs at the table, and the man is wearing a suit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "dining table", "bowl", "wine glass", "cup", "tie", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437720, "caption": "A young woman sits at a red-colored dining table, typing on her laptop while surrounded by a few paintings. She is wearing a hat, and her hair is down, exposing her face. The image captures the moment of her concentrating on her work, surrounded by art pieces that", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "vase", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 378831, "caption": "A woman in a green shirt is walking down a sidewalk next to a fire hydrant, carrying a shopping bag.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "fire hydrant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375503, "caption": "A person is sitting at a desk in a room with a staircase leading up to the second floor. The room has a large wooden desk and a large wooden chair, and there is a clock on the wall. The image captures a moment of a person working at their desk, possibly on a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "clock", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 330369, "caption": "A red fishing boat is docked at a pier, with a man standing on the deck looking out to the sea. There are two white boats moored nearby. The man is likely a fisherman or crew member preparing for the day's fishing trip.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 288576, "caption": "A man is playing a frisbee in the park, with a tree in the background. The man is throwing the frisbee and running towards it, while a little boy is riding a bicycle nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 32190, "caption": "A small, life-like horse statue sits on the sidewalk in front of a store. The horse has a brown and white color, and its mane and tail are visible. The horse statue is placed on a small pedestal, making it stand out on the sidewalk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "horse", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 535403, "caption": "In the image, there is a small, clean bathroom with a sink, toilet, and a few other items like a hair dryer, a toothbrush, and a toilet brush. A long mirror is also present in the bathroom.", "mscoco_hallucinated_words": [["toothbrush", "toothbrush"]], "mscoco_gt_words": ["bottle", "hair drier", "potted plant", "clock", "sink", "toilet"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 449798, "caption": "In this image, we see a desk with a computer, keyboard, and mouse. There is also a laptop, a book, and a variety of figurines and other objects on the desk. The desk is located in a bedroom, and it appears to be a cluttered space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "mouse", "cell phone", "book", "keyboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 375769, "caption": "A young boy sits at a table, eating a sandwich while looking at a bicycle parked outside.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["umbrella", "dining table", "hot dog", "cup", "bicycle", "car", "chair", "person"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.375}}, {"image_id": 426172, "caption": "A wine-themed gift shop showcases a table with a wine bottle, a wine bottle cap, a wine glass, and a wine-themed tablecloth. The display is surrounded by various items, such as a wine aerator, a wine key, and a wine decanter. The image", "mscoco_hallucinated_words": [["wine glass", "wine glass"]], "mscoco_gt_words": ["dining table", "bottle", "chair", "book", "knife"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 20650, "caption": "A delicious sandwich, salad, and a bowl of broccoli sit on a table, ready to be enjoyed. The sandwich is made of meat, bread, and cheese, while the salad consists of lettuce, tomato, and onion. A bowl of steamed bro", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "sandwich", "fork", "orange", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 138078, "caption": "A young baseball player stands on the field, holding a baseball bat while wearing a red baseball cap and a baseball jersey. He is looking down and seems to be contemplating the next play.", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 152499, "caption": "A group of friends is gathered around a swimming pool, playing games with a water gun and enjoying a fun day outdoors.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "dining table", "surfboard", "potted plant", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 180764, "caption": "A man is sitting on a couch, holding a donut in his hand.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["person", "microwave", "donut", "bottle"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 147762, "caption": "A delicious slice of chocolate cake is served on a plate, accompanied by a scoop of ice cream and a topping of whipped cream. This delightful dessert is presented on a white tablecloth and is ready to be enjoyed by the person who has just taken a bite", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "fork", "cake"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 113860, "caption": "A man is standing on a boat, which is floating in the water. He is holding a fishing rod and appears to be preparing to cast his line into the river.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460866, "caption": "A dental hygiene routine is being performed in the image. A toothbrush and toothpaste are seen in a bathroom sink, while a tube of toothpaste is being squeezed and a toothbrush is being used. The image shows a dental hygiene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "cup", "sink", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177015, "caption": "A man is sitting on a couch while using a laptop. He is also holding a cat that is resting on his lap, and the cat is looking at the computer screen. The man is focused on his work, while the cat is curious about what he is doing on the laptop. This scene captures the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "refrigerator", "chair", "couch", "apple", "cat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 333998, "caption": "A kitchen full of appliances and dishes is shown in this image. There is a fridge, stove, microwave, and sink, along with several dishes and utensils. The kitchen has a white and brown color scheme, and the room appears to be well-organized.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "refrigerator", "cup", "microwave", "sink", "suitcase", "oven", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 47131, "caption": "A group of men are attempting to clear a railroad track of debris after a train accident. They are surrounded by wreckage, including a derailed train car, as they work to restore the track and ensure safety. The image captures the aftermath of the accident and the efforts made by the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425447, "caption": "A man is standing in front of a white pickup truck, looking at the ground and possibly preparing to use a hose. The truck is parked next to a tree and is equipped with a water tank.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "fire hydrant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295105, "caption": "The man is standing in front of a kitchen sink, looking at a refrigerator and a stove. He is wearing a blue shirt and jeans, and appears to be preparing or finishing a meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "refrigerator", "sink", "apple", "oven", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 443259, "caption": "A modern kitchen with white cabinets, stainless steel appliances, and wooden countertops is displayed in the image. The kitchen has a large island, a dining table, and a sink, making it a spacious and functional area for cooking and entertaining.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "bottle", "refrigerator", "potted plant", "chair", "sink", "orange", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 537861, "caption": "A passenger train is pulling into a station, and a person is standing on the platform waiting for it to arrive.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "person", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 145020, "caption": "A duck is standing in front of a Christmas-themed display, wearing a red sweater and a Santa hat. The duck is holding a sign that reads \"Merry Christmas\" in a playful manner, and it is standing near a Christmas tree. This image captures the spirit of the hol", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "teddy bear", "person", "mouse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 249969, "caption": "A turkey dinner, complete with mashed potatoes, carrots, and other vegetables, is being served on a white plate. The meal is accompanied by a side of gravy and a glass of red wine. A fork and knife are also visible on the table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "fork", "bird", "broccoli", "spoon", "knife", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.625}}, {"image_id": 146504, "caption": "A man is sitting at a desk with a computer mouse and a keyboard in front of him, using the mouse to navigate through a document.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "cup", "mouse", "keyboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 40037, "caption": "A large clock tower stands tall in the city center, with a building and a car parked nearby. The clock tower appears to be a significant landmark in the area, serving as a focal point for both locals and tourists.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 343218, "caption": "A young man is playing tennis at an outdoor tennis court, with a racket and a tennis ball. He is using a tennis net to serve and is enjoying the sport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "car", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 301837, "caption": "A modern kitchen features a large, open space with a glass-topped island, white cabinets, and a white refrigerator. The kitchen also includes a dishwasher, an oven, and a stove, which are all part of the modern appliance collection. The space is well", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "clock", "apple", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 309071, "caption": "A man is sitting on a bench with his bicycle, while he is repairing the tire with his hands. The image is taken on a dirt road or a street in a tropical environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "potted plant", "bicycle", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 240681, "caption": "A young man is walking down a street, carrying a backpack, while standing next to a red motorcycle parked on the sidewalk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 178753, "caption": "A young girl sits in a red chair at an ice rink, wearing a red jacket and a smile on her face. She is holding a phone and seems to be talking to someone. The girl is enjoying her time at the ice rink and is possibly engaged in a conversation with someone nearby or", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 278890, "caption": "A man is holding a cell phone and is talking on it. He is walking with a woman and has his arm around her as they walk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47781, "caption": "A cozy bedroom with a red bed, a desk, and a lamp, filled with various personal belongings and decorations.", "mscoco_hallucinated_words": [["desk", "dining table"]], "mscoco_gt_words": ["tv", "vase", "book", "person", "bed"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 542792, "caption": "A large baseball bat stands tall in the foreground of a city street, overlooking the surrounding buildings. A tall building with a baseball on top can be seen in the background. This unique combination of a baseball bat and a tall building creates an interesting visual contrast between the two structures, showcasing the diverse architecture and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": "A group of men, including one with a beard, are sitting at a table enjoying their meal. They have a variety of foods, including pizza, salad, and drinks, and are enjoying their dining experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "bottle", "cup", "fork", "pizza", "chair", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 318777, "caption": "A group of baseball players is gathered on a grassy field, standing in a row, and ready to play. They are dressed in their respective uniforms and are wearing baseball gloves. The scene is in a stadium, with the stands full of people watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "chair", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 14773, "caption": "A colorful, fun, and delicious meal is being enjoyed by a person sitting at a table. The meal includes a tray of french fries, a sandwich, and a car-shaped hamburger. The person is enjoying their meal while sitting in a green-color", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["hamburger", "sandwich"]], "mscoco_gt_words": ["dining table", "hot dog", "cup", "bottle", "fork", "car", "spoon", "person"], "hallucination_idxs": [29, 34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.25}}, {"image_id": 521863, "caption": "A young man is skateboarding down the sidewalk in front of a large building, with a group of people watching from the doorway.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "skateboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 250540, "caption": "A group of people on motorcycles, including one man on a red motorcycle, are riding through the rain on a city street. The man is wearing a red helmet, while the other riders are wearing green helmets. The scene is captured from behind, showing the bikers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "cell phone", "motorcycle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 211604, "caption": "A young woman lays down on a wooden deck, wearing a tennis outfit and holding a tennis racket.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 298067, "caption": "A bottle of beer and a plate of grilled meat are sitting on a table. The plate contains a juicy piece of meat, and the beer is being poured into a glass. This image could be a perfect combination of a satisfying meal and a refreshing beverage, making it a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "cup", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 563938, "caption": "A group of people is gathered around a table, engaged in conversation while one person is using a mobile phone. The scene appears to be taking place in a living room or a similar indoor setting.", "mscoco_hallucinated_words": [["table", "dining table"], ["mobile phone", "cell phone"]], "mscoco_gt_words": ["bench", "bottle", "tie", "couch", "person"], "hallucination_idxs": [8, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 461311, "caption": "The image shows a group of people gathered at a park or field, with a man flying a kite while others watch. There is a large group of people, including a man holding a red handbag, a child, and a woman with a backpack. The scene appears to be a fun and social event,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["kite", "car", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 47940, "caption": "A young woman is sitting on her bed, surrounded by various books, a teddy bear, and a laptop. She is reading a book and holding a teddy bear while looking at the laptop.", "mscoco_hallucinated_words": [["teddy bear", "teddy bear"], ["teddy bear", "teddy bear"]], "mscoco_gt_words": ["person", "bed", "laptop", "book"], "hallucination_idxs": [15, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 261318, "caption": "A man is sitting on a bench in the city, surrounded by suitcases, chairs, and other luggage. He is on his cell phone, possibly making a call or checking his messages. The scene captures the hustle and bustle of city life, where people are constantly on the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "chair", "cell phone", "suitcase", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 134768, "caption": "The image shows a computer, keyboard, and mouse on a desk. There is also a pair of headphones and a black cable nearby. This could be a workspace or a home office, where the person is working or using their computer for various tasks.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "keyboard", "laptop", "mouse"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 1.0}}, {"image_id": 526414, "caption": "A cozy living room filled with books, a cat, and a sewing machine is the setting for this image. A couch and a TV are also present, making it a comfortable and relaxing space for people to enjoy their hobbies and spend time together. The cat adds a touch of warmth and", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "bowl", "laptop", "tv", "cup", "remote", "scissors", "couch", "cat", "book"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.4}}, {"image_id": 273132, "caption": "An elderly woman is sitting on a bench, surrounded by her belongings, and looking at her phone. She appears to be waiting for someone or using her phone for a specific task.", "mscoco_hallucinated_words": [["phone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["bench", "handbag", "person"], "hallucination_idxs": [18, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": "The man is holding a sandwich with sausages and eating it while standing on a sidewalk in the middle of a bustling city.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sandwich", "person", "hot dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 192656, "caption": "A baseball player is in the middle of a pitch, throwing a baseball towards the catcher. He is wearing a black and white baseball uniform, and his glove is on his left hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 272728, "caption": "A vase filled with colorful flowers sits on a wooden table, surrounded by a green rug and a chair.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 509811, "caption": "The image shows a large room filled with tables and chairs, where students are sitting and working on their computers.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "chair", "apple", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 412407, "caption": "A woman is holding a cell phone, which is displaying a black and white image on its screen. She is sitting on a couch, surrounded by people, and the image on the phone is likely showing a video or a picture.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["clock", "cell phone", "person"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": "A woman with a pink umbrella walks on a busy street, carrying a bag and shopping items, while a man stands nearby, looking at her. The scene takes place in a city, with a market or storefronts nearby, showcasing the hustle and bustle of urban", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "clock", "person", "handbag", "suitcase", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441363, "caption": "A young man is playing tennis, swinging his tennis racket with a red shirt and white shorts. He is in the middle of the court, ready to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 331084, "caption": "A group of people is gathered around a dining table, preparing a pizza meal. They have various ingredients such as pizza dough, toppings, and sauce on the table, and are using a knife to slice the pizza dough into individual portions. One person is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "pizza", "spoon", "knife", "person", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 282553, "caption": "In the image, a young woman and a man are walking along a path, passing by a large stone monument at dusk. They are likely enjoying a leisurely stroll or a scenic walk, taking in the beauty of the surrounding landscape. The man is holding a phone, while the woman has", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 328818, "caption": "A woman is sitting on a bench while putting on her shoe. She is in a park setting with a bicycle nearby, and there is a green tree behind her.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bench", "person", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 3103, "caption": "A man in a yellow helmet and a black jacket is doing a skateboard trick in the air, with his arms outstretched, while another man looks on in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "skateboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 188136, "caption": "In the image, a kitchen filled with various food items, pots, and a sink is captured. The kitchen is bright and clean, with a green color scheme. There are fruits, including oranges and apples, arranged on the counter, along with a large bowl of vegetables. A stain", "mscoco_hallucinated_words": [["apple", "apple"]], "mscoco_gt_words": ["dining table", "bowl", "sink", "orange", "person", "carrot"], "hallucination_idxs": [40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 449675, "caption": "A white plate is filled with a delicious sandwich, which includes various ingredients such as meat, cheese, and vegetables. The plate is placed on a white tablecloth, and there is a fork and knife next to the plate. A glass of water is also visible on the table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "sandwich", "bottle", "cup", "fork", "spoon", "knife", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 191691, "caption": "In the image, a man is standing in front of a bathroom sink, shaving his face using a shaving razor. He is wearing a blue bathrobe, and the bathroom is clean and well-lit.", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["toothbrush", "person", "bottle"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 89378, "caption": "A man in a motorcycle helmet and leather jacket is standing next to a red motorcycle in a parking lot.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 99874, "caption": "A young woman is sitting at a table with her phone, wearing sunglasses, and enjoying a meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "cat", "cell phone", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437895, "caption": "A colorful bed with a floral pattern, featuring a bed frame with an arched shape and a potted plant on the bed, is showcased in this image. The bed is surrounded by a lively and vibrant atmosphere, creating a cozy and inviting ambiance.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "vase", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557447, "caption": "A businessman in a suit sits at a conference table, holding a pen and looking down at a piece of paper. He is likely discussing a business proposal or reviewing documents related to the company's operations. The image suggests that the man is engaged in a professional setting and is actively participating in", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tie", "fork", "spoon", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 159979, "caption": "A group of people are gathered around a boat in a river, with various items such as a tray of food, umbrellas, and a raft.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "bowl", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 357, "caption": "A baseball game is in progress, with a batter on base and a fielder preparing to catch a baseball. The image captures the dynamic nature of the sport, showcasing the skill and teamwork involved in the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 538891, "caption": "A woman in a white tennis outfit is holding a tennis racket and standing on a grassy tennis court, ready to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 561967, "caption": "A train is passing by a line of cars, with a large shipping container on the tracks. The train is moving through the countryside, and there are some trees visible in the background.", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["traffic light", "car", "train"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "A train travels along a track next to a tunnel, with a passenger train and a freight train in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 7125, "caption": "A group of people, including a woman and a man, are riding bicycles on a dirt path by a body of water. The man is holding a water bottle and wearing a backpack, while the woman is holding a small dog. They are enjoying the scenic view and spending", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "bottle", "bicycle", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 221350, "caption": "A man is wearing a red tie with white text and a heart design, sitting in a chair, holding a red tie in his hand, and looking at a woman. The tie is likely a gift or a special item, as the man is carefully examining it. The woman might be his partner or someone he", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tie", "chair", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 280930, "caption": "A young girl is standing in front of a stove, holding a tray of doughnuts and smiling while standing near a counter. The image captures the moment of her enjoying her baking and the delicious aroma of freshly baked doughnuts.", "mscoco_hallucinated_words": [["doughnut", "donut"], ["doughnut", "donut"]], "mscoco_gt_words": ["refrigerator", "oven", "person", "bottle"], "hallucination_idxs": [15, 41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.5}}, {"image_id": 151081, "caption": "A small airplane is flying over a field, with a fence in the background. The image captures the moment of the plane taking off, or the pilot maneuvering the aircraft to land. The presence of the fence adds a sense of isolation and creates a clear visual contrast between the sky and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 122232, "caption": "A young woman is standing on a grassy tennis court, holding a tennis racket and preparing to serve a ball. She is wearing a yellow tennis outfit, and her tennis shoes are green. The image captures her in mid-action, with the ball in her hand and her eyes looking up", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 134223, "caption": "A delicious hot dog is served on a plate, accompanied by a side of fries and a side of coleslaw. The image showcases a variety of food options that are appealing to the taste buds.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "dining table", "bowl", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 198163, "caption": "A man is sitting at a table filled with various bowls of blue and green paint, likely getting ready to create art or paint a piece.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 3742, "caption": "A bowl of apples sits on a dining table, accompanied by a rose. The rose is placed next to a vase, and a large window is visible behind the table. This scene shows a cozy and inviting atmosphere, where people can enjoy a snack or have a conversation while admiring", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "apple", "bowl", "vase"], "hallucination_idxs": [44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 1.0}}, {"image_id": 217593, "caption": "A young boy is standing in a grassy area, ready to play baseball. He is wearing a baseball uniform, a baseball cap, and a glove. He is looking down and has a baseball in his hand. The image captures the moment before the boy swings his bat to hit the ball. The", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["baseball glove", "chair", "baseball bat", "handbag", "person"], "hallucination_idxs": [56], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2}}, {"image_id": 279078, "caption": "A young girl is excitedly standing in front of a refrigerator full of various bottles of beer, while she is holding a bottle of beer. She seems to be enjoying the cool and refreshing drink, and the bottles on the shelf are arranged in a colorful and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "person", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": "A man is playing tennis on a court, while a woman watches from the sidelines. The image is taken in a large indoor stadium, with the court and seating area visible in the background. The man is hitting the tennis ball with a racket, and the woman is likely observing the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "tennis racket", "couch", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 477016, "caption": "A young girl is standing next to a kitchen sink, looking at a small oven with a television screen on the stove.", "mscoco_hallucinated_words": [["television", "tv"]], "mscoco_gt_words": ["potted plant", "sink", "backpack", "oven", "handbag", "person"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 301266, "caption": "A group of people, including a young woman, are gathered around a table with various items, such as utensils, dishes, and a basket of bread. They are engaged in preparing a meal or snack, possibly for a gathering or event.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "fork", "sink", "spoon", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 475813, "caption": "A young girl is standing in a room, holding a remote control in her hand. She is wearing a blue shirt and is surrounded by various objects, including a stuffed animal. The girl looks up at the camera, perhaps curious about the presence of the photographer. The image captures a moment of her", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "remote"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 558784, "caption": "A young man is playing a frisbee in a green field while standing near a body of water. He is wearing a black shirt and is holding the frisbee in his right hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 308543, "caption": "A man is holding two silver spoons in a kitchen sink, with his hands covered in soap. The image captures a moment of cleaning and preparation for cooking, emphasizing the importance of proper cleanliness and hygiene in the kitchen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "person", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 359164, "caption": "A brown dog and a black dog play in a green grass field, while a brown dog is also seen peeking out of a white bag.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "dog", "chair", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "A small kitchen setup is displayed in a LEGO scene, featuring a refrigerator, sink, and stove. The kitchen is designed in a checkerboard pattern, which adds a unique and visually appealing touch to the scene. The LEGO kitchen has a small dining table and chairs,", "mscoco_hallucinated_words": [["table", "dining table"], ["chair", "chair"]], "mscoco_gt_words": ["refrigerator", "oven", "sink", "clock"], "hallucination_idxs": [48, 50], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.75}}, {"image_id": 143479, "caption": "A man is holding a tray of hot dogs, and an older woman is standing next to him. They are both outside on a grassy field, surrounded by a group of people. The man is likely preparing to serve the hot dogs to the people in the group. The scene is reminiscent of", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "hot dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 475024, "caption": "A vase filled with bright orange flowers is placed on a wooden table in a room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "orange", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 238065, "caption": "A young man is riding a skateboard on a wooden skate ramp, performing a trick or stunt in the sunlight.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "skateboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "A small bathroom in a house features a sink, a toilet, and a shower, along with a bottle of alcohol on the counter.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "toilet", "book", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 322163, "caption": "A group of men, including a chef and multiple waiters, are gathered around a large table in a restaurant kitchen. They are preparing to make pizza using a variety of ingredients and utensils. The chef is standing next to a pizza oven, while the waiters are gathered around the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "remote", "bottle", "potted plant", "microwave", "pizza", "oven", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 230983, "caption": "A young man is performing a skateboard trick in the middle of a city street, jumping over a pile of cardboard boxes. The man is wearing a black shirt and black pants, and he is jumping over the boxes with his skateboard.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "A spacious kitchen with a stainless steel sink, a refrigerator, a microwave, and a stove, along with a dining table and chairs, is shown in the image. The kitchen appears to be well-equipped for cooking and dining, with plenty of", "mscoco_hallucinated_words": [["table", "dining table"], ["chair", "chair"]], "mscoco_gt_words": ["refrigerator", "oven", "sink", "microwave"], "hallucination_idxs": [23, 25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 1.0}}, {"image_id": 53431, "caption": "A man is sitting on a chair, using a laptop on his lap. He is wearing a suit and tie, and is sitting in front of a brick wall.", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["chair", "person", "laptop"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 441840, "caption": "A young boy is swinging a bat at a baseball field, likely participating in a game or practice session. He is surrounded by other players, and there are a few adults present, possibly coaches or spectators. The image captures the moment of excitement and engagement as the young boy swings the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball glove", "car", "baseball bat", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 53465, "caption": "A group of friends are sitting at a table with a delicious cake on a plate. The cake is decorated with the words \"Welcome to Our Home\" in red and white icing, and it appears to be a special occasion. The friends are enjoying their time together, laughing and sm", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "cup", "fork", "spoon", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 381031, "caption": "A man is enjoying a snack with a bowl of peanut butter, a spoon, and a glass of juice on a table.", "mscoco_hallucinated_words": [["man", "person"], ["bowl", "bowl"]], "mscoco_gt_words": ["dining table", "cup", "bottle", "microwave", "donut", "apple", "spoon"], "hallucination_idxs": [1, 8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2857142857142857}}, {"image_id": 530520, "caption": "Three men are sitting on a grassy field, engaged in a discussion. One man is wearing a backpack, and the other two are wearing shirts. They appear to be having a conversation about something, possibly related to their work or personal matters. The scene is peaceful and natural, with a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "clock", "motorcycle", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 539555, "caption": "A young man is jumping on a skateboard, with his right foot raised and his left foot on the ground. The image is captured in a black and white photo, giving it a classic and timeless feel.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 279521, "caption": "Two men are standing next to a bus, looking at it. One of them is wearing a baseball cap, while the other has a beard. They are discussing something related to the bus, possibly planning a trip or waiting for a specific bus service.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "backpack", "handbag", "person", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 560439, "caption": "A group of people, including a man, a woman, and a child, are walking in a snow-covered area, possibly a ski slope, with snowboards and skis. They appear to be enjoying their time together, and the man is holding a snowboard, while the woman and the child are", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 248353, "caption": "A group of people, including a young boy, a girl, and a man, are enjoying a snowy day on a ski slope. They are all wearing ski gear and standing on the mountain, ready to start their day of skiing and snowboarding. The young boy is holding a snowboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 9628, "caption": "A man is riding a jet ski while jumping over the water, accompanied by a friend on a paddleboard.", "mscoco_hallucinated_words": [["jet", "airplane"], ["ski", "skis"]], "mscoco_gt_words": ["surfboard", "boat", "person"], "hallucination_idxs": [5, 6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 330050, "caption": "A man and woman are playing tennis at a court, possibly during a recreational match. The woman is holding a tennis racket, while the man is holding a tennis ball and is about to hit it back to her. They are both wearing tennis clothing and white shoes, and the man is standing with", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["bench", "person", "tennis racket"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 254161, "caption": "A man is walking through a city park, where a large stone fountain is located in the middle of the grassy area. The man is holding a camera in his hand, and there is a large, green tree behind him. In the background, there are skyscrapers and a city skyline", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["kite", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 275749, "caption": "A group of friends are gathered in a room, enjoying some drinks and having a good time. They are seated in a small space, with a laptop on a table and a TV behind them. The atmosphere seems lively and fun, with the presence of a couple of cups and a bottle,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "bottle", "cup", "mouse", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.625}}, {"image_id": 163518, "caption": "A chef, likely a restaurant worker, is standing at a table with a large pile of plastic salad bowls. She is wearing a white apron and a chef's hat, indicating her professional role in the food industry. The bowls are filled with various types of salad ingredients", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "chair", "oven", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 156696, "caption": "A man stands next to a train with a long, dark green passenger car, possibly a subway or commuter train. The train has a large engine attached to it, which is in the process of pulling the passenger car down the tracks. The man is standing near the train, and there are other people on the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 525202, "caption": "A group of friends are sitting at a table, enjoying a delicious pizza together. They have a variety of toppings, including meat and vegetables, and are sharing slices of the pizza with each other. The pizza is placed on a metal tray, which is sitting on a tablecl", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "cup", "fork", "pizza", "chair", "spoon", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 423984, "caption": "A bowl of pasta, carrots, and broccoli is served on a dining table.", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["dining table", "broccoli", "carrot"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 499486, "caption": "A cat lays on a bed next to a catnip toy, with a pile of clothes on the floor.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": "A young man is sitting in a car, wearing a tie and a black shirt. He appears to be smiling or posing for a photo. The car's rearview mirror is visible in the image, giving insight into the man's surroundings.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 288729, "caption": "A cute and colorful cake with a circus theme sits in front of a tent. It features a blue and white striped tent, a clown with a red nose, and a big smile on his face. The cake also has a bear and a bunny on top, giving", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bear", "teddy bear", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177721, "caption": "A young man is performing a skateboard trick on a ramp, showing off his skills and athleticism.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "skateboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": "In this image, a man with a long beard is standing near a large stone wall and looking at his cell phone while wearing a black hat. He is likely in a historical setting, possibly a church or a museum, as the stone wall and his attire suggest a connection to the past. The man'", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "handbag", "person", "horse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 252625, "caption": "A busy street with a mix of pedestrians and cyclists is seen in the image. There are various shops and a few bicycles parked along the sidewalk. The street is also lined with streetlights, which create a safe and well-lit environment for both pedestrians", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "potted plant", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 493610, "caption": "A group of people are standing next to a yellow truck with a blue trailer, which is being pulled by a blue pickup truck. There is also a person sitting on top of the blue trailer. The scene is set in a dusty, rural area, with a car parked nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 302789, "caption": "A suitcase and a backpack sit on a bed in a small room. The room has a small kitchenette, a sink, and a refrigerator, with a bed in the corner. A suitcase and a backpack are also present in the room, suggesting that someone has recently returned from a trip", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "sink", "backpack", "handbag", "suitcase", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7142857142857143}}, {"image_id": 30667, "caption": "A brown dog is lying on a boat, sitting next to a person and a man who is reading a book.", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 114108, "caption": "In the image, a group of people are sitting at a table with a pizza and a dining setup. One of the pizzas is a white pizza with green leaves on top, while the other pizza is a meat-topped pizza. They are both served on a dining table with", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "fork", "pizza", "chair", "spoon", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 328110, "caption": "A woman is sitting on a bench with her baby in a carrier while looking at her phone.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bench", "handbag", "person", "backpack"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 366111, "caption": "A man rides a bicycle on the sidewalk while another man is walking and carrying a briefcase, both of them in suits, in the city.", "mscoco_hallucinated_words": [["briefcase", "handbag"]], "mscoco_gt_words": ["traffic light", "bicycle", "person", "car"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 532481, "caption": "The image shows a man flying a kite in the sky, with a surfer riding a wave in the ocean below.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 291634, "caption": "A group of motorcycles are parked in front of a street in a city, with some of them being parked on the sidewalk. The scene is filled with a mix of black, silver, and red motorcycles, creating an interesting contrast of colors. The presence of people walking around and cars driving", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [55], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 463678, "caption": "The image features a man playing tennis, with a tennis racket and a ball, as he prepares to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 70815, "caption": "A dog is sitting on the sidewalk next to a bicycle and a bench, looking up at the camera.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["bicycle", "truck", "dog", "person"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 367872, "caption": "A baseball player stands at the plate, ready to swing a bat during a game. He is wearing a baseball uniform, and his teammates are gathered around him in the dugout.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "sports ball", "baseball glove", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 353898, "caption": "A man sitting on a bench in a park is surrounded by a flock of white pigeons, enjoying the peaceful atmosphere and the company of the birds.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "bird", "cell phone", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 88269, "caption": "A bowl of soup sits on a white plate, next to a slice of toast on a wooden table. The bowl is filled with a red soup, and the toast has a slice of cheese on it.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["sandwich", "bowl", "spoon"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 463211, "caption": "A girl and a boy are walking together, with the girl wearing a backpack and the boy holding a book. They are standing by a school bus, possibly waiting for their ride home.", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["bus", "person", "backpack"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "A beautiful floral arrangement sits on a table in a grand room, surrounded by elegant furniture and decorative elements. The vase is adorned with a variety of colorful flowers, adding a touch of elegance and beauty to the space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 98979, "caption": "A microwave oven is sitting on a countertop, next to a stove and a dishwasher in a kitchen. The microwave oven is silver in color, and it is clean and well-maintained.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "oven", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 244455, "caption": "Two motorcyclists ride down the street, with one rider giving a thumbs-up gesture while the other rider looks back. The scene is set against the backdrop of a city, with a car parked nearby. The motorcyclists seem to be enjoying their ride and expressing their", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "car", "motorcycle", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": "A pair of scissors and a pair of orange scissors are on a black surface, sitting next to a large black cloth.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "orange", "scissors"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 536154, "caption": "A young girl is surrounded by a pile of stuffed animals, including teddy bears, cuddly toys, and plush dogs. She is lying down on her bed, smiling and holding a stuffed animal. This image captures a child's joy and affection for their beloved", "mscoco_hallucinated_words": [["dog", "dog"], ["bed", "bed"]], "mscoco_gt_words": ["cat", "teddy bear", "person"], "hallucination_idxs": [21, 29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 374061, "caption": "A black cat is laying on a couch and holding a stuffed animal, possibly a teddy bear, while a teddy bear is also present on the couch.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bear", "couch", "cat", "teddy bear", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 560018, "caption": "A group of people is enjoying water sports in the ocean, riding surfboards and kayaks, and having fun while the waves are crashing against the shore.", "mscoco_hallucinated_words": [["kayak", "boat"]], "mscoco_gt_words": ["surfboard", "person", "kite"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 353320, "caption": "A man is sitting on a bench near a suitcase and a large, black guitar case. He has a bag or backpack on the bench next to him. The image shows a busy street scene, with people walking past the man and his belongings.", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["person", "bench", "handbag", "suitcase"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.75}}, {"image_id": 256628, "caption": "A yellow dog lays on the wooden deck, with its head and paws raised. The dog is likely enjoying the warm weather, and the deck provides a comfortable place for it to rest and relax.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": "A dog is eating a sandwich on a blue plate, looking up at the person holding it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sandwich", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 424270, "caption": "A young girl is sitting on a bed, surrounded by a pile of blankets, and there is a window in the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": "A horse is walking along a parking lot, passing by cars and trucks parked along the side of the road.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "horse", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 483227, "caption": "A group of children is gathered around a tennis court, participating in a tennis lesson or playing a game. They are standing in front of a net, with some holding tennis rackets, and one person is holding a tennis ball. The scene is likely a fun and engaging way for the kids to learn", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 228306, "caption": "A red double-decker bus is parked in front of a building, with a person walking towards it. The bus has a yellow and black stripe pattern, and it appears to be a London bus, given the presence of the iconic Routemaster design. The image captures a moment of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 416384, "caption": "A woman is sitting on a bench, using her cell phone, while wearing a bathing suit.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["chair", "cell phone", "person"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 364783, "caption": "A pink bathroom with a white sink, toilet, and shower is the focus of the image. The bathroom features a red floor and red walls, adding a pop of color to the space. The toilet and sink are positioned in separate areas, creating a sense of organization and efficiency", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "cup", "potted plant", "chair", "sink", "toilet", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 335041, "caption": "In the image, a man and a woman are walking in the snowy street while carrying skis. The man is wearing a red coat, and the woman is wearing a black coat. They are walking along a street with snow-covered sidewalks, likely enjoying a winter activity such as ski", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 531327, "caption": "A bowl of colorful vegetables, including broccoli, carrots, and bell peppers, is being served on a dining table. The dish is topped with a green salad, and there is a spoon next to the bowl. This image showcases a healthy and", "mscoco_hallucinated_words": [["bowl", "bowl"], ["bowl", "bowl"]], "mscoco_gt_words": ["dining table", "wine glass", "fork", "broccoli", "spoon", "knife", "carrot"], "hallucination_idxs": [1, 40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5714285714285714}}, {"image_id": 451228, "caption": "A group of people are walking down a busy street in the city, with one person riding a bicycle. A red double-decker bus is also present, and a couple of people are walking on the sidewalk. There is a Christmas decoration hanging from a streetlight, adding a festive", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "bus", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 256365, "caption": "A plate of delicious cupcakes, decorated with blue frosting, is displayed on a white plate. The cupcakes are arranged in a creative and visually appealing way, making them look appetizing and attractive.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cake", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 502936, "caption": "A man is playing tennis, hitting the ball back and forth with his tennis racket on a tennis court. The image captures the action of the man swinging his racket and preparing to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451449, "caption": "A black and white dog is laying in a bookshelf, surrounded by books and a small bed.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["book", "dog", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 51054, "caption": "An elderly woman is sitting on a bed, talking on a cell phone, while a partially-eaten meal is on a nearby table.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["cup", "bottle", "cell phone", "person", "bed"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 1268, "caption": "A woman is sitting on a bench near a river, looking at a swan in the water while a man stands next to her. They are both enjoying the serene view of the swan and the river. The image captures the beauty of nature and the tranquility of the moment.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["boat", "bird", "cell phone", "backpack", "handbag", "person"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3333333333333333}}, {"image_id": 62692, "caption": "A young woman is playing tennis, using her racket to hit a tennis ball back and forth on the court. She is wearing a black shirt and white shorts, and is in the process of serving the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542771, "caption": "In the image, a woman is sitting at a wooden dining table with a vase of flowers in front of her. The room is decorated with a patterned carpet, and there is a chair next to the dining table. A few items such as a book and a cup are also present on the", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["dining table", "potted plant", "vase", "chair", "book", "person"], "hallucination_idxs": [52], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.8333333333333334}}, {"image_id": 575406, "caption": "A vibrant, blue and red bus is parked outside a store, and a person is walking past it. The bus has a large, green, and white striped canopy on top, which adds to its distinctive appearance. The presence of a person and the store in the background suggests that the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "potted plant", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 244834, "caption": "A couple walks down a sidewalk under an umbrella, holding hands and enjoying the rainy day.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "potted plant", "bicycle", "car", "clock", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 151159, "caption": "A group of young adults is enjoying themselves on a skateboard park, with one man on a skateboard and another man on a skateboard, performing a trick in the air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277073, "caption": "A man riding a motorcycle is navigating through the busy streets of a city, with a police officer in the background, while a group of people and cars are present in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "car", "motorcycle", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 377879, "caption": "A large military tank is being transported on a trailer by a truck, with a crane in the background loading the tank onto the trailer. The tank is being transported in a city, with a train track nearby, indicating that it is likely being moved for military purposes.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "bed", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 436814, "caption": "A cluttered home office with a desk, chair, computer, and various items such as books, papers, and a lamp is the setting for this image. The desk is covered with papers and a lamp is placed on top, while the chair is positioned nearby. There is a door in the background", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["dining table", "chair", "mouse", "laptop"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.75}}, {"image_id": 63934, "caption": "A man wearing a nun's habit and a skateboard is riding down a sidewalk, passing by a parked car.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 275611, "caption": "A close-up image of a pizza being held by a hand in a silverware tray shows a delicious, freshly made pizza, possibly from a local restaurant. The pizza is placed on a table, and the silverware tray is holding it. The pizza's appearance suggests that", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "pizza", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 516248, "caption": "A person is sitting at a computer desk, using a keyboard to type on the computer. The person is surrounded by various electronic devices, including a laptop, a mouse, and a keyboard. The image is taken in a classroom setting, suggesting that the person might be learning how to use a computer or practicing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "mouse", "keyboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 478380, "caption": "A man is standing in front of a large group of sheep, likely on a rural road or a field. He is wearing a white hat and holding a black and white striped umbrella. The man is surrounded by a large herd of sheep, which could be part of a farm or a wildlife", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["sheep", "person", "car"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 422326, "caption": "In the image, a group of people are gathered around a motorcycle, admiring it. The motorcycle is a Harley Davidson, and it appears to be parked in front of a car. A man is standing next to the motorcycle, while another man is sitting on the back of the bike", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "car", "motorcycle", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 110449, "caption": "A man and a woman are sitting on a couch in front of a dining table. The man is holding a pair of headphones and wearing a t-shirt, while the woman is holding a remote control and wearing a tank top. They both appear to be enjoying their time together,", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["dining table", "laptop", "tv", "remote", "person"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6}}, {"image_id": 45550, "caption": "A man is holding a tray of food, with a sandwich and a cup of dipping sauce on it, while standing in front of a wall with a clock on it.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["clock", "sandwich", "person", "bowl"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 444913, "caption": "The image shows a man standing on a grassy area, holding a golf club, and wearing a grey shirt. He is standing in front of a house, and there is a large tree in the background. The man appears to be preparing for a golf shot, possibly taking a practice swing before stepping", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 82709, "caption": "A dog is flying in the air with a frisbee in its mouth, and a group of people are watching from a grassy field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "bottle", "cup", "backpack", "frisbee", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 132796, "caption": "The image features a group of people riding an elephant in a forest, with one person sitting on the back of the elephant and others standing on the side. The person sitting on the elephant is wearing a backpack and appears to be enjoying the ride.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bench", "chair", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 303099, "caption": "A cat and a cat are sitting on top of a toilet, next to a sink, and a bathtub.", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["cat", "toilet", "bottle"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "A group of motorcyclists rides down the street, passing by a parked car on the side of the road. A couple of bikers are visible in the image, with one rider wearing a helmet and another riding without one. They are surrounded by a group of cars, which", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 205193, "caption": "A large cup of hot tea is sitting on a table, surrounded by a tea bag and a cup of water. The tea bag has a Japanese label on it, indicating that it might be a Japanese green tea. The tea is likely brewed using a traditional tea-making method, and the presence of the tea bag", "mscoco_hallucinated_words": [["cup", "cup"], ["table", "dining table"], ["cup", "cup"]], "mscoco_gt_words": ["oven", "toaster", "person", "microwave"], "hallucination_idxs": [2, 10, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 272566, "caption": "A man sits on the ground in front of a fruit stand, smoking a cigarette while surrounded by various types of fresh fruits, including bananas, apples, and pineapples.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "person", "banana", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 170099, "caption": "A man in a suit stands in front of a large, brightly colored couch with a group of orange pillows. He is holding a white couch and seems to be posing for a photograph.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "orange", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 14940, "caption": "A cute orange cat is lying on a blanket, resting its head on a stuffed animal, while a brown dog is sitting on the blanket next to the cat. The cat is surrounded by a red and white striped blanket, creating a cozy and warm atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "couch", "chair", "orange", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 408449, "caption": "A young man is standing in front of a large glass elevator while holding a skateboard and wearing a backpack. He is posing for a photo, with a smiling expression on his face. The man is surrounded by people walking on the street, creating a lively and vibrant atmosphere in", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "truck", "skateboard", "car", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 140702, "caption": "An elephant calf is walking alongside its mother in a grassy field. The young elephant is close to its mother, and they appear to be enjoying the outdoors together.", "mscoco_hallucinated_words": [["calf", "cow"]], "mscoco_gt_words": ["bird", "elephant", "person"], "hallucination_idxs": [2], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 354540, "caption": "A man is sitting on a kitchen counter with his laptop and a tablet, and he is using his phone as a camera to take a picture of himself. He is surrounded by cables and a power strip, which indicates that he might be working on a project or troubleshooting an issue with his devices. The", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "microwave", "chair", "cell phone", "oven", "person", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 19763, "caption": "A man is sitting at a table, enjoying a slice of pizza with a glass of beer.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "fork", "pizza", "chair", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 191301, "caption": "The image depicts a person sitting at a dining table with a dessert plate containing a slice of chocolate cake, a spoon, and a cup of coffee.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "spoon", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 124236, "caption": "A caption for the image could be: \"A kitchen is filled with various cooking utensils, including a spoon, a bowl, and a pot, along with a kitchen sink and a dishwasher. The dining table is also set up with a vase and a plate,", "mscoco_hallucinated_words": [["sink", "sink"], ["vase", "vase"]], "mscoco_gt_words": ["dining table", "bowl", "spoon", "oven", "toaster"], "hallucination_idxs": [33, 47], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6}}, {"image_id": 344930, "caption": "A red fire hydrant is sitting on the side of a city street next to a parked car. The image captures the vibrant color of the fire hydrant and the urban setting of the city street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "fire hydrant", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 14285, "caption": "A cat lies on a bed, surrounded by various items such as a TV, a remote control, a remote, a book, and a stuffed animal. The cat seems to be enjoying its cozy spot, surrounded by its favorite things.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "tv", "chair", "cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 82488, "caption": "A caption for the image would be: \"A bedroom with a comfy bed, a desk, and a clock is a cozy space to relax and unwind. The warm orange and yellow colors add a cheerful touch, while the clock serves as a reminder of time passing. This room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "remote", "clock", "orange", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 348251, "caption": "A man is standing on a snowy slope, wearing a green and black outfit, holding a ski pole, and carrying a backpack. He is skiing down a mountain, with a chairlift in the background. The scene appears to be from a winter skiing resort, where people can enjoy out", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 150703, "caption": "A man is enjoying a delicious sandwich and a beer at a bar, with a tasty-looking hot dog and a beer glass in front of him.", "mscoco_hallucinated_words": [["man", "person"]], "mscoco_gt_words": ["dining table", "sandwich", "hot dog", "cup"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 381615, "caption": "The image shows a dining room window with a variety of plants and decorations, creating a cozy and welcoming atmosphere. There are potted plants, a vase, and a few decorative items placed on a table, adding to the overall aesthetic of the room. The presence of a chair", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["cup", "potted plant", "vase", "chair", "book"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 352703, "caption": "A woman is cooking at a stove, using a blue pot to prepare food. She has a spoon in one hand and is stirring the pot with the other hand. The image shows a close-up of the woman's hand stirring the pot, with a blue dish and a spoon", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "bottle", "cup", "spoon", "oven", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 111109, "caption": "A young boy sits on a chair, holding onto a chair's backrest with his hands. He wears a white shirt and blue shorts, and his hair is messy. The image captures a moment of the boy's playfulness and curiosity as he balances himself on the chair", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "tie", "chair", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": "A city street is filled with vehicles, including a bus, and a couple of cars. People are walking down the sidewalk, and a man is riding a bike. In the background, there is a large building with a sign that reads \"Hotel.\" The image captures the bustling atmosphere of", "mscoco_hallucinated_words": [["bike", "bicycle"]], "mscoco_gt_words": ["bus", "motorcycle", "person", "car"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 49005, "caption": "A baseball game is being played on a grass field, with a man holding a baseball bat and a baseball glove standing on the field. The field is surrounded by a crowd of people, and there are other players nearby. The atmosphere is lively and engaging, showcasing the excitement and passion of the sport", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 410114, "caption": "A group of cows are walking down a road, followed by a truck and a cowboy riding a horse.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "person", "horse", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 100274, "caption": "A train is parked on a railroad track, with a truck and a car driving past the train. The image captures the busy intersection of a road and railroad tracks, showcasing the diverse modes of transportation in use. The presence of both a train and cars indicates that the area is an", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317254, "caption": "A man rides his motorcycle down the street, passing a red car on the sidewalk. The motorcycle is black and has a blue background, while the man is wearing a black jacket and helmet. The scene shows a city street with a mix of cars and pedestrians.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425569, "caption": "In the image, a large, modern kitchen with various silver pots, pans, and utensils is visible. The kitchen is clean and organized, with a stainless steel sink and stove. The scene shows a well-equipped kitchen, ready for cooking and preparing meals.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "bowl", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 28842, "caption": "A man is skateboarding down a grassy hill with a group of people watching him. The man is having fun while riding his skateboard, and the group of people is enjoying the activity as well. The image captures the excitement and joy of the skateboarder and the onlook", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 319607, "caption": "A busy intersection in the city is filled with various modes of transportation, including a bicycle, a car, and a bus. In the center of the intersection, a traffic light is signaling for vehicles to proceed. The scene is bustling with people, with some walking and others riding their b", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "bus", "bicycle", "car", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 210372, "caption": "A red kitchen with a white sink and stove is shown in the image, with an empty sink and a dishwasher nearby. The room also features a refrigerator and a microwave oven, with a dining table nearby. The kitchen seems to be clean and organized, with a", "mscoco_hallucinated_words": [["stove", "oven"], ["microwave", "microwave"], ["oven", "oven"], ["table", "dining table"]], "mscoco_gt_words": ["refrigerator", "sink", "bottle"], "hallucination_idxs": [8, 32, 33, 38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5714285714285714, "Recall": 0.6666666666666666}}, {"image_id": 156915, "caption": "A bouquet of red roses is sitting on a wooden table, surrounded by a vase and a white plate. The arrangement is beautiful and creates a warm and inviting atmosphere. The red roses add a touch of elegance and romance to the setting, making it a perfect choice for a special occasion or", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 349642, "caption": "A man is sitting on a bench with his dog sitting next to him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": "A group of people are gathered around a pier, watching the boats in the water. The pier is filled with boats of different sizes and shapes, including some that are parked on the shore. There are several people on the pier, and some of them are holding umbrellas. The image suggests a sunny", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "boat", "person", "handbag", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 45435, "caption": "The person is holding a black and white smartphone with a large screen, and they are smiling while looking at the phone. The image is taken in a workspace, suggesting that the person might be using their phone for work-related purposes.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": "In this image, a man is sitting at a desk in a room with a computer and a large screen displaying a video game. The man is playing the game on the computer, and he has a bottle of soda and a cup on the desk next to him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "bottle", "cup", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7142857142857143}}, {"image_id": 72656, "caption": "Two young children are sitting at a small table with a red and white striped tablecloth, eating pizza together. They are enjoying their meal, and the table setting suggests a casual, family-friendly atmosphere. The image captures the joy and companionship of sharing a meal with", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "pizza", "chair", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 372087, "caption": "A train is waiting at a platform, with a green and yellow carriage in the foreground.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "suitcase", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 336209, "caption": "A young man is riding a skateboard on a dirt road, performing a trick. He is balancing himself on the skateboard while standing on a bench, showcasing his skill and athleticism.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 46031, "caption": "A laptop, a mouse, and a keyboard are placed on a dining table with a window behind them. The room is tidy and organized, with a laptop, a mouse, and a keyboard on the table. There is also a small desk lamp nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "tv", "mouse", "cell phone", "keyboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 283118, "caption": "A family of three, consisting of a mother and two children, sits at a dining table in a restaurant, enjoying a meal together. The mother and children are smiling, while the mother has her arm around the young boy.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "car", "pizza", "chair", "cell phone", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 429598, "caption": "A kitchen with a large wooden table and several appliances, including a stove, refrigerator, and oven, is surrounded by wood paneling. The kitchen is set up for cooking and dining, with a sink and dishwasher nearby. The appliances are arranged in", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["refrigerator", "oven", "sink", "bottle"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.75}}, {"image_id": 333365, "caption": "A large airplane is parked on the runway at an airport, surrounded by other airplanes and a red-colored jet. The image captures the bustling atmosphere of an airport, with multiple aircrafts, passengers, and luggage present.", "mscoco_hallucinated_words": [["luggage", "suitcase"]], "mscoco_gt_words": ["airplane", "truck", "person", "car"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 424174, "caption": "A colorful fruit bowl filled with various fruits, such as bananas, apples, oranges, and grapes, sits on a wooden table. The fruit bowl is surrounded by a variety of fruit, with bananas on the table and fruit in the bowl, adding a vibr", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "banana", "apple", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 3035, "caption": "An airplane sits on a tarmac at an airport, surrounded by various vehicles, including a truck, and a person walking near the airplane.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "truck", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 177213, "caption": "A person is sitting at a table, holding a large pizza with a fork and a knife. There is a plate of salad on the table as well.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cup", "fork", "pizza", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 438535, "caption": "A clock with hands is located on the side of a building, and it is in front of a city street with cars driving by.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "clock", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 490711, "caption": "In the image, a white refrigerator is sitting in a kitchen, with cabinets, countertops, and a sink nearby. There is also a dishwasher in the kitchen. The refrigerator is filled with food, and it appears to be covered in frost, suggesting that", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "sink", "banana"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 163728, "caption": "A cat lays on a table, surrounded by a laptop and a mouse. The cat is sleeping or resting, possibly using the mouse as a pillow or cushion. This image captures a moment of relaxation and comfort for the cat, who is enjoying its surroundings and the warm", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "cup", "mouse", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 456756, "caption": "A large giraffe stands in a zoo enclosure, with a tall fence behind it, and a group of people in the background. The giraffe is eating from a feeding station.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "person", "giraffe"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 281028, "caption": "A passenger train car with seats, with a man sitting on the window seat and looking out the window.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "car", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 343937, "caption": "A young woman is wearing a pink jacket, a black helmet, and black pants as she rides a snowboard down a snow-covered slope. She is standing on her snowboard, balancing and preparing to turn.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "person", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277051, "caption": "Two small birds sit on a table, eating from a plate. They are in the presence of a bottle of soda and a knife. The image is quite simple and straightforward, showcasing the birds' natural behavior and interaction with the objects in their environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "bird", "chair", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 145666, "caption": "A bowl filled with fresh broccoli and carrots is placed in front of a stove, ready to be cooked in a pot of water. This image shows the beginning of the cooking process, where the vegetables are being prepared for consumption.", "mscoco_hallucinated_words": [["stove", "oven"]], "mscoco_gt_words": ["dining table", "bowl", "broccoli", "carrot"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 304984, "caption": "A delicious plate of sandwiches, a glass of orange juice, and a bowl of mixed fruit are arranged on a white plate, accompanied by a fork and a knife. This setting is perfect for a casual lunch or a refreshing snack.", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["sandwich", "bowl", "wine glass", "fork", "orange", "cake"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 122467, "caption": "A man is holding a handheld video game console, possibly a Nintendo Game Boy, with a controller in his hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "couch", "remote", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 518287, "caption": "A smiling toothbrush is sitting on top of an orange, with a white toothpaste tube beside it. The toothbrush is holding a toothbrush toothpaste, and the scene is captured in a funny and playful manner.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "orange", "cup", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 145448, "caption": "A cat sits on top of a motorcycle, a man and a woman are having a conversation, and a group of people are dining at a table.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "car", "chair", "cat", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 352900, "caption": "A bowl filled with a creamy, pasta dish, topped with fresh broccoli and a green apple slice, sits on a white plate.", "mscoco_hallucinated_words": [["apple", "apple"]], "mscoco_gt_words": ["fork", "knife", "bowl", "broccoli"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 153607, "caption": "A colorful vase, a small flower, and a glass bowl are arranged on a table, creating a visually appealing and inviting setting. The blue vase adds a pop of color to the table, while the flower adds a touch of nature and beauty. The bowl, possibly filled with food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "vase", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 157581, "caption": "A group of wine bottles and glasses are arranged on a table, with a few empty glasses next to a wine bottle. The scene is set in a restaurant, where the wine glasses and bottles are placed for guests to enjoy during their meals.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "cup", "bottle", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227438, "caption": "A spacious hotel room features a comfortable bed, a desk, and a lounge chair. A large window provides natural light and a view of the city. The room is decorated with a nice combination of colors, and there is a clock on the desk.", "mscoco_hallucinated_words": [["desk", "dining table"], ["desk", "dining table"]], "mscoco_gt_words": ["clock", "chair", "couch", "bed"], "hallucination_idxs": [10, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.75}}, {"image_id": 116037, "caption": "A young girl is playing softball in a field, wearing a baseball cap and a black and yellow uniform. She is standing in front of a white fence, and she's holding a bat. The girl is swinging the bat and ready to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "baseball bat", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 202658, "caption": "A pink toilet sits on a porcelain base in front of a trash can, with a white chair and a toilet paper holder nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 18150, "caption": "A man is sitting on a bed with a young boy, eating a pizza together.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["bottle", "couch", "pizza", "backpack", "person"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 418711, "caption": "A man rides his bicycle while carrying a large basket of bananas on the back, weaving through a busy street with cars and trucks.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "bicycle", "car", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 92107, "caption": "A bowl of creamy corn soup sits on a green tablecloth, accompanied by a spoon and a green plate. The soup is made with corn, broccoli, and milk, giving it a smooth and flavorful texture. This image captures a moment of enjoyment and satisfaction while enjo", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "broccoli", "spoon"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 491000, "caption": "A busy street scene with people walking and biking, cars driving, and a bicycle parked on the sidewalk.", "mscoco_hallucinated_words": [["bicycle", "bicycle"]], "mscoco_gt_words": ["dog", "car", "motorcycle", "handbag", "person"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 401163, "caption": "A man and a dog are sitting on a bench in a park, surrounded by trees and grass.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 39663, "caption": "A backpack filled with various items sits on the floor next to a chair. The items include a laptop, a book, a pencil case, and some office supplies. The laptop appears to be open, and the book is open as well, with a pencil inside it. The pencil", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["laptop", "scissors", "cell phone", "backpack", "book"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6}}, {"image_id": 268293, "caption": "A tennis player is serving the ball during a match. He is wearing a blue shirt, white shorts, and a tennis racket in his hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "A spacious kitchen features a countertop with a sink, stove, and refrigerator. There is a large white cupboard on the wall, which houses a variety of dishes, utensils, and cooking supplies. A dishwasher is also present, and the kitchen is", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["bottle", "vase", "clock", "apple", "sink", "spoon", "oven"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2857142857142857}}, {"image_id": 358086, "caption": "A group of young women are playing a game of frisbee in a field, with one woman jumping to catch the frisbee. The image captures the joy and excitement of the players as they engage in the sport and spend time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "chair", "backpack", "frisbee", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 89541, "caption": "A colorful and delicious lunch is presented in a yellow plastic container. It contains a variety of sweet and savory foods, such as a banana, a slice of cake, and a strawberry. The lunch is placed on a colorful table, which adds a vibrant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "banana", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 239445, "caption": "A man is holding a frisbee and wearing a white t-shirt, posing for a photo with a beach in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "A young boy is holding a kite and standing in the middle of a green field, with a dog standing nearby. The kite is flying in the sky, and the boy is smiling.", "mscoco_hallucinated_words": [["boy", "person"], ["boy", "person"]], "mscoco_gt_words": ["cat", "dog", "kite", "car"], "hallucination_idxs": [2, 33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 487990, "caption": "A group of friends are enjoying a picnic outdoors, with a person playing the guitar while others are eating and drinking.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "bottle", "cup", "fork", "donut", "spoon", "knife", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1}}, {"image_id": 138834, "caption": "A man in a black ski jacket and ski goggles is walking down a snowy road while carrying a ski pole and holding onto a snowboard.", "mscoco_hallucinated_words": [["snowboard", "snowboard"]], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 492057, "caption": "A man, possibly in his mid-20s, is posing for a selfie in a restroom mirror. He has a beard and wears a black and white striped shirt, a green jacket, and a black tie. He is holding a phone in his hand while taking the photo", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 388215, "caption": "A man in a white shirt is playing tennis with a yellow ball on a tennis court. He is in the middle of a swing, preparing to hit the ball with his tennis racket.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 111409, "caption": "A man wearing a helmet and riding a motorcycle is seen on a road near a parking lot. The man is riding a black motorcycle with a sidecar, which has a red engine and is parked next to a car. The man is riding the motorcycle down a slope and", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 451391, "caption": "The person holding a bunch of broccoli is posing in front of a display of vegetables, including a bunch of broccoli.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 92462, "caption": "A group of cows are walking down a street in a city, with a white car in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "backpack", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 397268, "caption": "A cozy and inviting outdoor setting is displayed in the image, featuring a green chair and a green bench sitting next to each other, surrounded by potted plants. A bicycle is parked nearby, adding a touch of functionality and practicality to the scene. The combination of comfortable seating,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "potted plant", "bench", "bicycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 127659, "caption": "A man is sitting on a bench, looking at his phone while waiting for a train on a platform. The man is likely waiting for the train to arrive at the station, and he is engaging in a conversation with someone in the image.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["bench", "dog", "person", "train"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.75}}, {"image_id": 251857, "caption": "A group of young men are hanging out in a park, engaging in various activities such as skateboarding, playing basketball, and hanging out. They are wearing casual outfits and appear to be enjoying their time together in the sunny outdoor setting.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "skateboard", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 243212, "caption": "A young boy is standing in a grassy area, holding a frisbee. He is wearing a green shirt and blue jeans, and his hair is messy. The image captures the boy's joyful expression as he holds the frisbee, ready to play with it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "car", "frisbee", "truck", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 444304, "caption": "A man is sitting on a couch, watching a TV. He is holding a remote control and appears to be engaged in the show. The television is on, and the man is sitting close to the screen, focusing on the show.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["person", "remote", "tv", "bed"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.75}}, {"image_id": 305000, "caption": "A woman stands in front of a vegetable stand, surrounded by various types of fruits and vegetables. She is holding a basket, possibly filled with purchases. The woman is wearing a black shirt and pants, and her outfit suggests that she is a vendor at the market. The scene capt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "person", "banana"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "Two men dressed in black suits and ties are enjoying a meal at a fancy dinner event. One of them is sipping a beer, while the other is holding a glass of wine. They are both sitting at a table, and the setting appears to be upscale.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "wine glass", "bottle", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 154846, "caption": "A close-up image of a slice of pizza on a plate, with several toppings and a small, sliced pineapple on top, is shown. The pizza slice has a mix of vegetables, cheese, and meat, with a generous amount of toppings. The pine", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 567254, "caption": "A little boy is sitting on the floor in front of a television, watching a show. He has his eyes fixed on the screen and is using a pink pencil to draw.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "person", "tv", "bottle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 79261, "caption": "A man in a white shirt and black pants is standing on the edge of a fountain, cleaning it with a mop. He is wearing a red and white striped hat and has a green plastic bucket and a mop in his hand. The man is surrounded by a large crowd", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "handbag", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301402, "caption": "A young man sits at a dining table, typing on his laptop. He is wearing a hat and a scarf, which may be for fashion or warmth, while the man is enjoying his meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "bottle", "potted plant", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 415828, "caption": "A group of people, including a man, a woman, and a child, are gathered near a street in a city. They are standing in front of a building with a red umbrella on top of it. The street has a number of cars parked along the side, and a few people are walking around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "traffic light", "stop sign", "car", "backpack", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 543231, "caption": "A woman is using a remote control to play a video game on a console, with her friends watching her in the background. She is holding the remote with her right hand and is focused on the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "remote", "book", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 495357, "caption": "A group of people, including a man, a woman, and a young girl, are standing on a sidewalk. The man is riding a motorcycle while the woman is holding a small dog. The woman and the girl are looking at the man on the motorcycle, and they seem to be in awe", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 523175, "caption": "A bowl of hearty vegetable soup sits on a table, filled with a variety of vegetables and a spoon for serving.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "spoon", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 184945, "caption": "In the image, a group of motorcycles, including one white motorcycle, are parked next to each other in a city street. The bikes are lined up against a railing, and there is a white bicycle nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "motorcycle", "bicycle"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 49942, "caption": "A young man, dressed in a suit and holding an umbrella, poses for a photograph in a city setting.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["umbrella", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 223019, "caption": "A man is standing on a train platform, looking at a train with an orange and black exterior.", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["car", "person", "backpack", "handbag", "suitcase", "train"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 42889, "caption": "A cute teddy bear sits on a red computer desk, wearing glasses and holding a microphone, while a computer keyboard is laid out on the desk.", "mscoco_hallucinated_words": [["computer", "laptop"], ["desk", "dining table"], ["computer", "laptop"], ["desk", "dining table"]], "mscoco_gt_words": ["bear", "keyboard", "teddy bear"], "hallucination_idxs": [8, 9, 20, 27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 22112, "caption": "A small pot with green herbs sits on top of a wooden table, accompanied by a blue vase filled with flowers.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "vase", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 247587, "caption": "A man is standing on a surfboard, waving to the camera while he is on the beach, with the ocean in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": "A man is riding a bike on a city street with a bus in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bicycle", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 545056, "caption": "In the image, there is a group of sheep grazing in a green field with a fence in the background. The sheep are standing in a grassy area, with some standing on the fence as well. The image captures the serene and peaceful scene of the sheep grazing in the open field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "dog", "car", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 401411, "caption": "A chef stands in front of a stove, holding a spatula and a bowl of ingredients. He is surrounded by various dishes and utensils, including a cutting board, a knife, and a mixing bowl.", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["dining table", "bowl", "cup", "book", "oven", "person", "carrot"], "hallucination_idxs": [33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.42857142857142855}}, {"image_id": 2867, "caption": "A group of people, including a young man, a woman, and a child, are standing on a snowy trail, possibly near a ski resort. They are all wearing winter gear and are preparing to use their skis and poles to ski down the snowy trail. The woman is holding a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 246963, "caption": "A group of bikers is riding down a road, with their motorcycles lined up on the side of the street. The bikers are wearing helmets, and one rider is holding a sign that reads \"Biker Safety.\" The scene appears to be a group of b", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "stop sign"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498225, "caption": "A group of people, including an elderly woman, a man, and a woman, are standing in front of a bakery display case, looking at a variety of baked goods. They are likely excited about the selection of sweet treats, and the elderly woman is holding a small bag. The scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["donut", "cell phone", "handbag", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 124601, "caption": "A modern kitchen with a dining table, a sink, and a microwave is filled with various items. The dining table is covered with a tablecloth, and there are cups, a laptop, a dish, and a bottle of wine on the table. The sink is clean, and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "laptop", "wine glass", "bottle", "cup", "microwave", "sink", "keyboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 581749, "caption": "A colorful and fresh image of a variety of vegetables, including broccoli, carrots, and lettuce, is sitting on a table in a kitchen.", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["dining table", "orange", "broccoli"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 227960, "caption": "A bowl filled with steamed Brussels sprouts is being served at a dinner party.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "wine glass", "cup", "spoon", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 286503, "caption": "A baby elephant is standing next to a large metal cage, holding onto a rope with its trunk. The elephant is in a zoo or wildlife area, and it appears to be interacting with the cage and the people nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "sports ball", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 315740, "caption": "In the image, a spacious kitchen with a wooden floor and cabinets is filled with various appliances, including a stainless steel refrigerator, a microwave, and a sink. The kitchen also features a dining table with chairs, and there is a couch in the", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"], ["table", "dining table"]], "mscoco_gt_words": ["bowl", "tv", "potted plant", "microwave", "couch", "chair", "sink", "oven"], "hallucination_idxs": [23, 38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 142108, "caption": "A group of people, including a young girl, are gathered around a table where they are engaged in a fun activity, possibly a craft project or a meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "person", "banana"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 542933, "caption": "A baseball player is on the field, holding a bat and ready to swing at a pitch. He is surrounded by a large crowd of fans and is positioned on a baseball field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "sports ball", "baseball glove", "chair", "baseball bat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 475043, "caption": "A group of friends are gathered around a table, enjoying their drinks and socializing. The scene captures the warm atmosphere and shared enjoyment of the beverages.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bowl", "laptop", "bottle", "couch", "spoon", "person"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 456784, "caption": "A man is cutting a cake with a knife, likely preparing it for serving or consumption.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "person", "cake"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 33753, "caption": "A black remote control sits on a bench next to a pink-colored TV set, with a green chair nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "remote", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 448694, "caption": "A group of young boys are playing a game of frisbee on a grassy field, engaging in a fun and active outdoor activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": "A bowl of delicious and healthy noodles is being enjoyed by a person. The noodles are stir-fried with vegetables, and a fork is being used to pick up the food. This meal is likely a balanced and satisfying option for the person, as it combines carbo", "mscoco_hallucinated_words": [["person", "person"], ["person", "person"]], "mscoco_gt_words": ["dining table", "bowl", "fork", "broccoli", "carrot"], "hallucination_idxs": [12, 44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.4}}, {"image_id": 503210, "caption": "A living room filled with furniture, including a couch, a chair, a piano, and a couple of throw pillows. There is also a dining table with chairs, and a vase holding flowers. The room is decorated with orange curtains and a clock on the wall.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["potted plant", "vase", "clock", "couch", "chair", "orange", "book"], "hallucination_idxs": [29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.7142857142857143}}, {"image_id": 142257, "caption": "A busy street with multiple cars is shown in the image. A car is stopped at a traffic light, while a person is looking at their phone or reading a book while waiting for the light to change. In the background, there are other cars and a truck driving on the road. The scene highlights the various", "mscoco_hallucinated_words": [["phone", "cell phone"], ["book", "book"]], "mscoco_gt_words": ["traffic light", "truck", "person", "car"], "hallucination_idxs": [28, 32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}], "overall_metrics": {"CHAIRs": 0.246, "CHAIRi": 0.08144578313253012, "Recall": 0.5712984054669704, "num_hallucinated_caps": 123.0, "num_caps": 500.0, "hallucinated_word_count": 169.0, "coco_word_count": 2075.0, "length_response": 41.856, "hallucinated_caps_ls": [144305, 324008, 247179, 39053, 269873, 253630, 317320, 161227, 195645, 343534, 370657, 460347, 254368, 459141, 277479, 409346, 300124, 185327, 482432, 379842, 203110, 556478, 506401, 278365, 368367, 21779, 333712, 148977, 467887, 401010, 388237, 24104, 527497, 61959, 473118, 265628, 499594, 258209, 285820, 245664, 443299, 354559, 545594, 219546, 535403, 375769, 426172, 138078, 180764, 147762, 47781, 14773, 563938, 47940, 134768, 526414, 273132, 412407, 188136, 191691, 561967, 280930, 3742, 217593, 477016, 539951, 564629, 53431, 381031, 9628, 330050, 423984, 30667, 328110, 366111, 291634, 70815, 88269, 463211, 536154, 560018, 353320, 416384, 531327, 51054, 1268, 542771, 436814, 478380, 110449, 45550, 303099, 205193, 140702, 124236, 150703, 381615, 226802, 210372, 429598, 333365, 145666, 304984, 352900, 227438, 18150, 491000, 39663, 474499, 105782, 138834, 111409, 127659, 444304, 223019, 42889, 401411, 581749, 315740, 475043, 99053, 503210, 142257]}}}