{"overall_metrics": {"CHAIRs": 0.1843687374749499, "CHAIRi": 0.06819421713038734, "Recall": 0.47308394160583944, "num_hallucinated_caps": 92.0, "num_caps": 499.0, "hallucinated_word_count": 125.0, "coco_word_count": 1833.0, "length_response": 39.68336673346693, "hallucinated_caps_ls": [324008, 39053, 128119, 401027, 317320, 161227, 32625, 18688, 67833, 254368, 231534, 209347, 13550, 300784, 344942, 300124, 12669, 133146, 261097, 185327, 348654, 268854, 495513, 506401, 183571, 325836, 352734, 401010, 313928, 59710, 229659, 258209, 453731, 145020, 240681, 178753, 47781, 47940, 526414, 273132, 188136, 191691, 557447, 217593, 477016, 558784, 539951, 230983, 53465, 381031, 9628, 163518, 366111, 70815, 88269, 536154, 158806, 531327, 1268, 151159, 478380, 45550, 205193, 272566, 14940, 14285, 226802, 425569, 28842, 283118, 490711, 277051, 122467, 518287, 352900, 227438, 18150, 92107, 474499, 105782, 487990, 138834, 305000, 567254, 543231, 523175, 42889, 581749, 227960, 286503, 475043, 456784]}, "results": {"sentences": [{"image_id": 144305, "caption": "There are a few computer devices displayed in the image. A laptop, placed near the center of the scene, is sitting on a desk or table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "keyboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 164091, "caption": "In the image, there are two dolls sitting in beds. A large doll is placed in the center, while a smaller doll sits in the foreground, next to the larger one", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 308003, "caption": " The image features a green park bench with a cracked and worn surface, resting under a dull sky. The bench takes up most of the scene, occupying the majority of the space within the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": " The image features a sandwich and a salad on a plate. There is a knife placed near the plate as well", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 95908, "caption": "A computer desk with multiple devices is showcased in the image. A keyboard and mouse are located on the desk, with the keyboard towards the left side and the mouse towards the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 329614, "caption": "The scene features a yellow school bus driving down a street surrounded by churches. There are several churches visible in the image, with at least two churches at the sides of the road, and another one situated further down", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 324008, "caption": " The image showcases a tray of food that includes various items. In the center of the tray is a banana sitting next to several bottles and a container", "mscoco_hallucinated_words": [["bottle", "bottle"], ["container", "bowl"]], "mscoco_gt_words": ["dining table", "banana", "train", "orange", "airplane", "person", "cup"], "hallucination_idxs": [25, 28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.14285714285714285}}, {"image_id": 52700, "caption": " The image depicts a large dining table that is covered with numerous dishes of cake and cupcakes. There are numerous cake slices placed on the table, covering multiple forks and spoons", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 501311, "caption": " The image captures a baseball game in progress, with several players spread throughout the scene. The main focus of the image is a pitcher on the mound, throwing a baseball in an intentional manner, possibly attempting to retire an opposing player", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 247179, "caption": " The image shows a group of people riding on the back of two elephants, with one of them carrying a person. The elephants have elaborate decorations on their backs, adding to the festive atmosphere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "elephant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 577912, "caption": "A bathroom is showcased in the image, featuring a white toilet situated near a window. A sink can be seen nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toothbrush", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 196341, "caption": "The image depicts a group of people standing and walking around an enormous clock in the middle of a room. The clock is quite large, with both numbers and letters prominent on its face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 234433, "caption": " In the image, there is a left turn sign placed near a street sign and several signs below it. The signs indicate a location where the street intersects with a parking area, as there is a pole nearby with multiple bicycle symbols around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 455610, "caption": " In the image, there is a red motorcycle parked on the sidewalk near a building. Two people are in the scene, standing next to the motorcycle, and one person is walking toward them, possibly taking a closer look", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": " The image shows a table with several pieces of food placed on it, including a bowl of eggs and a bowl of pita bread, surrounded by various cups and knives. The food appears to be a part of a meal or an appetizer, and it is spread out across the table", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "spoon", "cake", "apple", "cup"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.42857142857142855}}, {"image_id": 493862, "caption": "In the image, there is a man standing on a grassy field holding a baseball, likely waiting for a pitch. The field is filled with grass, extending to the horizon", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 269873, "caption": "The image depicts a busy street scene with a group of people, some walking and some standing, crossing over the street from one side to the other. The people are walking on a street with a trolley passing by", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 524656, "caption": "The image showcases a small kitchen with a microwave, a toaster oven, and a refrigerator. The microwave is placed near a window, while the toaster oven is located closer to the kitchen's center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "spoon", "bottle", "sink", "wine glass", "knife", "microwave", "toaster", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.36363636363636365}}, {"image_id": 369547, "caption": "The image features a black and white dog sitting on a rocky surface, with a bird in the sky above. The bird seems to be circling over the dog, potentially chasing it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "bird", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 181446, "caption": "A man with glasses is leaning against an open refrigerator, looking into it. He is in a kitchen filled with various food and bottles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "sink", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 128119, "caption": "The scene features a bus with two bicycles attached to the front of it. The bus is white and parked on a street with a few cars on the side", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["cell phone", "backpack", "bus", "bicycle", "handbag", "person"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.16666666666666666}}, {"image_id": 401027, "caption": " The image features a sandwich placed on a table, which appears to be cut in half. The sandwich is accompanied by two small bowls filled with dips, one of which appears to be yellow in color", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "sandwich", "knife", "cup"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 253630, "caption": "In the image, there is a living room filled with furniture. The centerpiece of the room is a black coffee table with a glass top and a small square-shaped footstool placed in front of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 326021, "caption": "A woman is sitting behind a table with a teddy bear on it. The teddy bear is placed on the left side of the table, taking up most of the space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": "In the image, there are several people present, including a man riding a bicycle down the street with yellow stripes, two other men, and a woman. The man on the bicycle is holding a backpack and is surrounded by other people going about their day", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": "The image features a person riding a wave on a surfboard in the water. The man is in the center of the scene, riding the wave in the foreground", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "cat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 161227, "caption": "The image features a couch with a remote control sitting on top of it, with a laptop on a nearby table. There are also a cell phone, a bottle, and a clock in the scene", "mscoco_hallucinated_words": [["table", "dining table"], ["bottle", "bottle"], ["clock", "clock"]], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "keyboard", "laptop"], "hallucination_idxs": [21, 31, 35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.42857142857142855, "Recall": 0.6666666666666666}}, {"image_id": 25812, "caption": " The image shows a person snowboarding down a snow-covered slope while facing towards the right side of the image. There is a snowboard and skis on the ground near the person, indicating that they may have stopped skiing before or during their downhill journey", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 267537, "caption": "The image depicts a group of four women sitting on a bench, each wearing an umbrella to shield them from the rain. They are holding hands, possibly as a symbol of unity or support", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "umbrella", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 195645, "caption": " In the image, there are several people gathered around a table, with a wine glass in the middle. The people appear to be engaged in conversation as they dine together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "wine glass", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 155671, "caption": "The scene is an empty, sunny street on a beautiful day. There are a few cars present, one at the end of the street, one in the middle, and another near the top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 412894, "caption": "According to the picture, it is a busy street scene with multiple people walking, shopping, and standing near numerous signs. There are also a few traffic lights located near the street, one at a corner and two near the center of the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 32625, "caption": " In the image, there is a table with various food items placed on it. One plate holds a portion of food that appears to be a mixture of broccoli and carrots", "mscoco_hallucinated_words": [["broccoli", "broccoli"], ["carrot", "carrot"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "book", "cup"], "hallucination_idxs": [30, 32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.2}}, {"image_id": 18688, "caption": "There is a baseball game happening in a room, captured on a television screen. In the middle of the image, a baseball player is standing at the plate, holding a bat, and another player is positioned behind him", "mscoco_hallucinated_words": [["television", "tv"]], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 343534, "caption": "According to the image, there is a small doll dressed in a knitted sweater standing next to a brown teddy bear. The doll is positioned on the left side of the image, and the teddy bear is positioned on the right side of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "potted plant", "chair", "book", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 370657, "caption": "In the image, a group of people is riding on a motorcycle, with several adults and at least two children. They are wearing masks, possibly due to an outbreak of COVID-19 in the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "In the image, a man is standing at the top of the bleachers in a sports stadium, eating a hot dog in the stands with a crowd of people around him. Many other people are visible in the background, watching and socializing during the baseball game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460347, "caption": "This image depicts a white bus driving down a road surrounded by a busy parking lot. The bus is located in the middle of the lane, while several cars are following closely behind, driving along the road in various positions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 398753, "caption": " The image captures a baseball game taking place, with a large crowd gathered around the field, possibly watching the action on the field or waiting to play themselves. The players are dispersed throughout the field, with some players standing near the first and third bases, a few closer to the batter, and others closer to the infield", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 67833, "caption": "The image shows a large pizza placed on a table in the center of a room, surrounded by various food items, including two bottles of wine, and two spoons. There are also two cups on the table", "mscoco_hallucinated_words": [["spoon", "spoon"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "bottle", "knife", "wine glass", "person", "pizza", "cup"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.4444444444444444}}, {"image_id": 272880, "caption": "In the image, there is a piece of pizza on a plate with the word \"mystic pizza\" written on it. There is a cup of coffee nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 254368, "caption": " The image depicts a man in a white robe sitting in bed, holding a slice of pizza as he eats. He is surrounded by various items such as dishes, bottles, and a handbag, which suggests a casual, relaxing setting", "mscoco_hallucinated_words": [["bottle", "bottle"], ["handbag", "handbag"]], "mscoco_gt_words": ["pizza", "person", "bed"], "hallucination_idxs": [32, 36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 1.0}}, {"image_id": 193108, "caption": " In the image, there are multiple baseball players, including a batter standing at the plate, swinging a baseball bat, and a group of onlookers, likely cheering them on. ", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 459141, "caption": " According to the picture, a person is riding a bicycle with a straw hat or a hat of some sort. There are also a few other people in the scene, but they are not riding bicycles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 231534, "caption": "The image depicts an airport scene with an airplane parked on an airport tarmac and various people, vehicles, and items involved in the logistics of the airport. On the tarmac, there are multiple trucks, several cars, and a couple of carts, all likely transporting luggage and other airport supplies", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["handbag", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.8}}, {"image_id": 227031, "caption": "A man and woman are standing together, likely at a wedding or celebration, as they are getting married or commemorating their union. They are both wearing ties, and the man is cutting the cake, while the woman assists him in the process", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "tie", "cake", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 209347, "caption": " In the scene, there is a woman wearing headphones while sitting on the bench of a subway train, looking at her cell phone. She is surrounded by other people on the train", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["cell phone", "train", "tie", "handbag", "person"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6}}, {"image_id": 523292, "caption": " A cat is standing on top of a laptop sitting on a coffee table, looking at a piece of paper placed on the table in front of it. The laptop is positioned near the front right corner of the table, while the paper is placed near the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cat", "chair", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 12375, "caption": " The image displays a white plate, possibly a serving plate, filled with a variety of food items, including meat, potatoes, carrots, and pickles. The plate appears to be positioned on a dining table or a tabletop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 13550, "caption": "According to the picture, there is a woman standing next to an elephant. She seems to be petting the elephant, possibly feeding it, as people might do with domestic animals like dogs or cats", "mscoco_hallucinated_words": [["dog", "dog"], ["cat", "cat"]], "mscoco_gt_words": ["handbag", "elephant", "person"], "hallucination_idxs": [35, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 146837, "caption": " The image captures a man skateboarding in an urban setting, appearing to perform a trick while riding a skateboard along a sidewalk or path. He is riding on the top of the skateboard, and it appears that he is going to leap over something or perhaps performing a trick", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 67042, "caption": "The image depicts a man standing in a corridor or passageway while checking his cell phone. He is dressed in a tie, possibly indicating a formal or business setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 209925, "caption": "The image depicts a baseball player in the middle of the field, ready to pitch a baseball. He is standing on the mound, holding a baseball, and he is in the act of throwing a pitch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 2154, "caption": " The image shows a shopping cart in the middle of a street, placed next to a park bench. There are multiple people in various locations nearby, standing, walking, and sitting on the bench", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "car", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 274931, "caption": "The image captures a black and white scene of a street where several cars are parked along the side of the road. The cars are parked near some tires and there are some buildings in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 104326, "caption": "The image features a very clean and well-organized kitchen. It has two dining tables located near each other in the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "oven", "chair", "clock", "sink", "knife", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 233888, "caption": "According to the picture, a young child, likely around three years old, is playing a video game that features a baseball game. The child is standing in front of a large television set and holding a baseball bat, ready to play the video game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "baseball bat", "person", "baseball glove", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 213905, "caption": "The image features two women in black and white walking on a tennis court. They are holding tennis rackets in their hands, possibly playing against each other or chatting before a match", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "backpack", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 277479, "caption": " The image features a little girl standing in front of an open refrigerator, holding her baby doll. There are a few people standing nearby the little girl, including one person closer to the left, another person towards the center, and a third person on the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 300784, "caption": " The image shows a group of children sitting on a couch or bench together, enjoying the presence of a cat sitting next to them. There are four children, with two kids seated on either side of the cat, while the other two are sitting at the front of the couch", "mscoco_hallucinated_words": [["cat", "cat"], ["cat", "cat"]], "mscoco_gt_words": ["couch", "dog", "person", "bench"], "hallucination_idxs": [20, 40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 183766, "caption": "The image depicts a table with three pieces of food on it. The center piece is a cake-like dessert topped with garnishes, including cherries and berries", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "cake", "knife", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 169169, "caption": "According to the picture, a large green tree is located near a sign on the sidewalk, with the words \"springing in the city\" above it. There are several people on the street, with some standing near the tree and others further away from it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "potted plant", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 409346, "caption": " In the image, there are two women standing next to each other, attending a party. They are wearing matching outfits, which gives them a sense of unity", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 522262, "caption": " (image description) In a picture, several bicycles are parked in a row along a fence next to a sidewalk. The bikes are various sizes and are spaced out, creating an organized yet slightly chaotic scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "The image features a man with glasses and a beard, who has a yellow ball placed in front of his nose. The man appears to be peering through a glass surface, which is probably a mirror, to see the yellow ball better", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 344942, "caption": "The image features a small toy robot with a blank expression sitting on top of a laptop, which is partially visible in the picture. There is another laptop or computer screen on the right side of the scene, likely belonging to a person or a character in a cartoon or animation", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["clock", "laptop", "tv"], "hallucination_idxs": [45], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 275929, "caption": "According to the picture, there are three old, dirty toilets sitting on the steps of a building. They appear to be in a pile, with the two upper toilets leaning against the steps, while the lower toilet sits further down", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": " According to the picture, there are a number of people standing outside wearing raincoats, holding umbrellas and walking in the rain. Some of the people are wearing ties and one is wearing a green hat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 300124, "caption": "The image shows a wooden chair with a small television mounted on top. The TV is positioned on a dining table-like surface, sitting on the chair's cushion", "mscoco_hallucinated_words": [["television", "tv"], ["tv", "tv"]], "mscoco_gt_words": ["chair", "couch", "dining table", "microwave"], "hallucination_idxs": [9, 15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 46919, "caption": "According to the image, there is a man hiking on a snow-covered mountain, traversing the side of a hill. He appears to be wearing snowshoes and has a backpack", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 434022, "caption": "This scene captures a long train traveling on a train track with several coal cars in the background. The train consists of two engines and several other cars with varying positions and widths", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 490491, "caption": " According to the picture, a small, rocky road is the main focus of the scene. It is situated in front of a tall building with various signs nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 175878, "caption": "According to the picture, four people are standing outside next to each other, forming a group. The people are all looking down and seem to be engaged in conversation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 12669, "caption": "The image features a room with several people in it, some standing and others sitting on chairs. A woman in a striped shirt is holding a wine glass and appears to be enjoying a wine tasting event", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["handbag", "vase", "wine glass", "person"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 192496, "caption": "The image showcases a blue and white train parked on the tracks at a train station. The train is positioned across the entire scene with two main sections: one is near the front and the other is towards the middle of the train", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 133146, "caption": "According to the picture, there is a large, nicely decorated living room with a fireplace, a couch, a chair, and a dining table. The room also contains various potted plants placed throughout, adding a touch of nature to the interior", "mscoco_hallucinated_words": [["table", "dining table"], ["potted plant", "potted plant"]], "mscoco_gt_words": ["vase", "chair", "couch", "book", "tv"], "hallucination_idxs": [27, 34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.4}}, {"image_id": 53744, "caption": "In the image, there is a cutting board filled with a variety of food items, including sliced tomatoes and lettuce. The knife used to cut the vegetables is prominently visible in the image, along with the food spread out on the board", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "dining table", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 375902, "caption": " The image features a person wearing ski gear, possibly skiing down the snow-covered mountains, holding a pair of skis together. There are two people on the slopes nearby who appear to be watching or observing the skiing action", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498747, "caption": "In the image, a man is talking on his cell phone, possibly discussing something with the person he is communicating with. A few other people are in the background, one in the left corner and another two in the right corner, but they seem to be less involved in the conversation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bottle", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 52435, "caption": "According to the image, there is a large group of people on a sandy beach, some sitting and others standing around. A surfboard is visible on the beach, suggesting a water activity, with multiple people in the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "bird", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 301977, "caption": " The image depicts a brown cow standing in front of a store or market, possibly browsing for food or drinks. The cow is positioned close to the left side of the image, right outside the store front", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 261097, "caption": " The image features a tennis player walking along a sports court, with many spectators surrounding the player. The player, wearing a black shirt and white shorts, holds a tennis racket, possibly looking off to the side or for a specific ball", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["chair", "bench", "tennis racket", "person"], "hallucination_idxs": [45], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 227204, "caption": " In the picture, three women are sitting at a table with a cell phone, cereal, and bananas. They appear to be chatting and drinking, perhaps on their lunch break", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "banana", "spoon", "bottle", "knife", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 353981, "caption": " The image is a black and white photograph of an airplane with multiple people on the tarmac next to it. The plane is sitting on the ground and several people are standing around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 185327, "caption": " In the image, a large group of elephants is walking down a street, attracting the attention of both people and vehicles nearby. The elephants are walking from the left side of the scene towards the right, spreading out as they pass by various businesses and shops", "mscoco_hallucinated_words": [["elephant", "elephant"], ["elephant", "elephant"]], "mscoco_gt_words": ["bus", "horse", "car", "person", "cow"], "hallucination_idxs": [8, 26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.2}}, {"image_id": 348654, "caption": "There is an iPhone and a small television sitting on a desk in front of a keyboard, with an additional monitor visible. The iPhone is placed on a black-covered smartphone holder near the TV, while the TV is positioned to the left and behind the monitor", "mscoco_hallucinated_words": [["keyboard", "keyboard"]], "mscoco_gt_words": ["cell phone", "laptop", "tv", "dining table"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.75}}, {"image_id": 482432, "caption": " The image features a bathroom scene with a sink, a toothbrush, and a tube of Aveeno skin care product sitting next to it. The bathroom is spacious and well-lit, providing a sense of cleanliness and comfort", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toothbrush", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 454161, "caption": "In the image, there is a slice of pizza placed on a white plate. The slice of pizza is situated at the middle of the plate and has several small pieces, giving the appearance of an individual-sized pizza", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "fork", "dining table", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 144723, "caption": " The image features a black and white dog in the middle of a field, leaping into the air to catch a red frisbee with its mouth. The dog is the center of attention, and it appears to be enjoying the action", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "dog", "frisbee", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "The image shows a person holding a cellphone in their hand. The cellphone appears to be a flip-style phone with a black and grey color scheme", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 379842, "caption": " The image shows a book and a video game controller sitting on a wooden table. The book appears to contain information about a video game, and the game controller is possibly for the Nintendo Wii game system", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 203110, "caption": "The image depicts a large orange trolley traveling down the track, likely in a city or suburban setting. There are several people in the scene, some standing near the tracks and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "train", "orange", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 556478, "caption": " In the image, there are two pizzas neatly placed on a stove top. One pizza is on the left side of the pan, and the other pizza is slightly higher on the right side of the pan", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "oven", "bottle", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 103815, "caption": "The image captures a moment during a baseball game where a man in a baseball cap is on the mound, holding a baseball glove as he prepares to throw a ball. Another man, with a baseball bat in hand, is swinging at a baseball pitched by the pitcher", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451943, "caption": " The image features a neatly made bed in a bedroom with the top sheets pulled back and white blankets visible. The bed is situated close to a window, allowing ample light into the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "dining table", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 268854, "caption": " There is a sandy beach where two boats and two cars are parked next to each other. A woman carrying a basket of bananas on her head is walking along the beach, possibly toward the water", "mscoco_hallucinated_words": [["car", "car"], ["banana", "banana"]], "mscoco_gt_words": ["handbag", "boat", "person"], "hallucination_idxs": [10, 24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 34464, "caption": "According to the picture, a group of people are walking across a sandy beach, carrying a large board. The board appears to be red, and it is being carried by three individuals: one person is carrying the front, another person is carrying the middle section, and a third person is carrying the back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 495513, "caption": " In the image, a man and a woman are standing next to each other and posing for a photo. The man is holding a bottle and a beer, while the woman is holding a hot dog", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["fork", "hot dog", "person"], "hallucination_idxs": [26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6666666666666666}}, {"image_id": 529256, "caption": "According to the picture, there are two dogs lying on a red bed in a room. The larger dog is on the left side of the bed, while the smaller dog is closer to the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "In a room with a television, a cat is sitting on top of a media center, such as a TV stand or shelf. The cat is placed on the left side of the media center and is positioned in front of the TV, with its attention directed towards the screen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 506401, "caption": "The image captures a small town square featuring various public transportation vehicles such as cars, buses, and a truck parked in different parts of the area. The town square has a statue prominently displayed in the center, surrounded by trees and paved roads", "mscoco_hallucinated_words": [["bus", "bus"]], "mscoco_gt_words": ["cat", "traffic light", "car", "person", "truck"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 406611, "caption": " The image depicts a busy ski resort, with many people standing around and skis visible. Snow covers the ground, as everyone seems to be dressed and ready for skiing activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "The image shows a white truck with a satellite dish parked on the side of a road. The truck appears to be stationary, with several satellite dishes on its roof, creating a bit of interest for passersby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "car", "person", "truck", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 278365, "caption": "According to the picture, the scene shows a man and a woman sitting outside at a table, enjoying a meal together. They are dining on a slice of pizza, which is placed on a plate on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 69757, "caption": "The image features three people, a man, a woman, and another person, sitting around a dining table with chairs on each side. The woman appears to be cutting a cake that is placed in the center of the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "cake", "knife", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 432213, "caption": "In the image, there is a plate with a sandwich and a serving of french fries. There is another sandwich and french fries at the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "sandwich", "wine glass", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 368367, "caption": "According to the picture, a woman is shown talking on a cell phone, holding it close to her face and smiling as she communicates. ", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "There is a sand-filled street at the center of the scene with traffic lights above it, creating a unique view. The street extends from the right side of the scene to the left side, and some of the sand has been pushed aside or rearranged", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 92131, "caption": " The scene is set in front of a parked bus, with a large green bus with a foreign writing prominently on its front, facing the viewer. A number of people are gathered around the bus, with some approaching from the left side, others from the right side, and some standing near the back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": " The image shows a woman laying on top of a suitcase, smiling. The woman is the main subject, while the suitcase is the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565148, "caption": "The scene takes place in a baseball game, likely a professional or semi-professional match. There are several players scattered around the field, including a baseball player up to bat, a catcher, and an umpire, who are the main focus of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 160183, "caption": "The image shows a red and white fire truck parked outside of a building, likely in front of a garage or parking lot. There is also a car parked near the fire truck, with another vehicle located further away in the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 555456, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 235595, "caption": "In the image, several motorcycles are parked along the sidewalk next to a street, forming a row of motorcycles in the same row. One of the motorcycles is on the left side of the image, with another one in the middle, followed by another one on the right side of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "potted plant", "car", "parking meter", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 489909, "caption": "The image displays various fruits, including an orange, a banana, and two or three more fruits in the background. These fruits are placed in a basket, creating a visually appealing display of fresh produce", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "orange", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 501080, "caption": "According to the picture, a large vase with a single flower on top is filled with a bouquet of colorful flowers, likely poinsettias, which are red and pink. The bouquet is composed of multiple flowers throughout the vase, covering the entire interior", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 405183, "caption": " The scene shows several people in a living room, with a woman standing in the center, holding a video game controller. There are a few additional individuals in the room, situated closer to the edges", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "potted plant", "chair", "couch", "book", "handbag", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 409138, "caption": "The image features a city street with several vehicles parked along the side and the bus, which has the words \"image content,\" written on it. One car is located in front of the bus, while two other cars are nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411840, "caption": "In the image, two women tennis players are walking across the court, each holding a tennis racquet in their hands. The women are walking from left to right, leaving a space between them as they proceed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 333712, "caption": " The image shows a slice of pizza with cheese and onions, prominently displayed on the table. The pizza has been cut into several pieces, each with a slightly different size and shape", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "spoon", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 148977, "caption": " In the image, there is a teddy bear with headphones on its ears sitting on a desk or table. The headphones are on top of its head, covering its ears, which is a unique and interesting aspect of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "bottle", "bear", "keyboard", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 399058, "caption": " The scene depicts an elephant walking down a road in front of a truck, with a man riding the elephant. The man can be seen seated on the elephant's back, enjoying the unique experience of riding the massive animal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "orange", "person", "truck", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 183571, "caption": " According to the picture, a man and a dog are on a small red boat, with the man standing on a hose near the left side and the dog on the right side of the boat. There are two bottles on the boat, with one placed near the man and the other on the right side", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 1.0}}, {"image_id": 325836, "caption": "The image showcases a motorcycle with a purple and orange paint job, standing out among several other motorcycles and a car. The motorcycle is on the left side of the picture, while other motorcycles are located throughout the scene", "mscoco_hallucinated_words": [["orange", "orange"], ["car", "car"]], "mscoco_gt_words": ["handbag", "motorcycle", "bicycle", "person"], "hallucination_idxs": [9, 21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 437910, "caption": "The image captures a small bathroom with a toilet, located at the far right of the room. The toilet is positioned near the door, creating an inconvenient and cramped space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 155885, "caption": "The image captures a black and white scene with a group of birds swarming around a man sitting on a boat at a dock. The birds are spread out over the water, with some closer to the man's boat while others are further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 467887, "caption": " The image features a man, who appears to be in his mid-50s, sitting at a table using a laptop. He is wearing a red shirt and has glasses on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "couch", "mouse", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 174402, "caption": " The image features a tennis player in a blue shirt holding a tennis racket on the tennis court. A sports ball is also present in the image, possibly the one the player is attempting to serve or return", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 352734, "caption": "The image features a young boy sitting at a dining table eating a piece of chocolate cake with a fork. There is another person in the room, sitting in a chair near the child", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.8}}, {"image_id": 346716, "caption": "In this scene, a double-decker bus is driving down a city street surrounded by traffic. There are several other buses behind the lead bus, and some are parked, likely during their normal operating schedule", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 451144, "caption": " The image captures a snowy mountain scene, with two people standing on top of the snowy slope, observing the surroundings. One person appears to be wearing skis, while the other person is not wearing any", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295656, "caption": "According to the picture, the scene features several people dressed in fancy attire, eating dinner together. There are three men and one woman, with each person holding food on a plate", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "tie", "clock", "car", "person", "pizza", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 129886, "caption": " The image features a group of skiers gathered at a ski slope with a ski lift in the background. Several pairs of skis are visible, including ones with two people each, on the snowy slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557998, "caption": "According to the picture, a young man is sitting at a table with a bottle in front of him, likely focusing on something he is holding in his hand. The bottle seems to contain a liquid, such as an alcoholic beverage", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 401010, "caption": "There is a white bed situated in the middle of the image, with a black chair next to it. Near the bed, there is a desk with a laptop placed on top of it", "mscoco_hallucinated_words": [["desk", "dining table"], ["laptop", "laptop"]], "mscoco_gt_words": ["chair", "sink", "tv", "bed"], "hallucination_idxs": [28, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 567562, "caption": "According to the picture, there is a woman sitting at a dining table with her two children. They are all enjoying a meal together, with pizzas, slices of pizza, and wine placed on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "book", "broccoli", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2727272727272727}}, {"image_id": 313928, "caption": "A person is standing on a patio overlooking the beach, enjoying a day outdoors. The patio features a table with chairs and a large bottle of drink on the table, as well as a yellow surfboard leaning against a nearby wall", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["surfboard", "dining table", "chair", "bottle", "wine glass"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.8}}, {"image_id": 490284, "caption": "In the image, a dog's head is seen resting on a person's arm, looking up and possibly begging for attention. There are other people present in the image, but none of them are touching the dog", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 346940, "caption": " There is a stove in the image with a kettle resting on top. The kettle has its spout at the right side of the stove", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "knife", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "The image depicts a woman walking down the street in front of a gas station, with the sign for the store visible in the background. The gas station's sign is in black and white, indicating the time period", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 255934, "caption": " The image features an adult elephant and a baby elephant walking next to each other in a fenced area. The baby elephant is following closely behind the larger one, creating a striking scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "elephant", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 278627, "caption": "According to the image, there are various pictures of people enjoying food at a restaurant. There is a group of people, including a man and woman, eating different types of food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "potted plant", "spoon", "chair", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 400851, "caption": "According to the picture, there is a group of people gathered on the beach in front of a lake. Several individuals are sitting and lounging on a bench near the water, while others are standing or walking in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "boat", "chair", "sports ball", "umbrella", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 472610, "caption": "In the image, a woman is standing next to a dog, both outdoors in a field. There are multiple cows in the background of the scene, some of them positioned closer to the camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 78565, "caption": " The image portrays a group of people enjoying a day at the beach. There are several small sailboats scattered around in the water, creating a pleasant and playful atmosphere for the people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": "According to the picture, a young man is riding a skateboard down a street or alleyway, in the middle of an outdoor gathering or event. Several other people can be seen around him, some of whom are enjoying the gathering or standing in different spots, including some close to the skateboard rider", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "chair", "bottle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 289640, "caption": "According to the picture, there are several people sitting around tables in a room. A man with glasses is sitting in a chair with an orange frisbee over his face, and another person is close by", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "wine glass", "orange", "person", "cup", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7142857142857143}}, {"image_id": 122602, "caption": " The image displays a table with a variety of crafts and materials spread across its surface. A pair of scissors is located on the left side of the table, while a bottle of glue is situated in the middle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "bottle", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 24104, "caption": "The image shows a desktop setup consisting of a television, two monitors, a book, and other assorted items. The TV is located on the left side of the setup and displays a program, with a second monitor situated on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bed", "mouse", "keyboard", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 183709, "caption": "In the image, there are multiple people standing on the sidewalk, possibly waiting to cross the street. The scene features a crosswalk, which is a designated area for pedestrians to safely cross a road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 59710, "caption": "According to the picture, a small, black and white refrigerator is open and visible in the room. Inside, there is a bottle on the shelf, indicating a collection of beverages", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["chair", "dining table", "refrigerator"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": "According to the picture, there is a little boy wearing a baseball glove and holding a baseball in a baseball field. He is standing close to the fence that surrounds the field, with the ball in his hand and a baseball glove on his hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 314729, "caption": "The image depicts a vintage photo of a baseball player in a white uniform, standing and holding a baseball bat. The player has a serious expression, and it appears that he may be posing for the photograph", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 527497, "caption": " According to the picture, there is a large desk with two computer monitors at its center. The monitors are positioned side by side, displaying various images", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 411564, "caption": "The image features a man sitting on a table in front of a window, using a cell phone. He is sitting on the table with a bottle near him, possibly enjoying the outdoors or the view from the window", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "bottle", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 320350, "caption": "The image features a man and a woman standing next to each other on their skis, both wearing snow gear. There are three dogs with them \u2013 one is slightly in front of the couple, while the other two dogs are slightly behind them on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 401857, "caption": "The image features a baseball player at bat, preparing to swing a baseball bat at a baseball ball on the field. The player stands near the home base, as seen in the top-left corner of the picture, and is likely waiting for the right pitch to hit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "bench", "person", "baseball glove", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 285302, "caption": "In the image, a young boy is sitting at a dining table, surrounded by various crafting materials. He is holding some paper and appears to be cutting it with a pair of scissors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "scissors", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 61959, "caption": "The image depicts a large bus driving down a street in a city. The bus has a colorful advertisement on its side, which might be a form of public transportation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 229659, "caption": "The image shows a laptop computer sitting on a table in a restaurant, with a keyboard, mouse, and monitor on the table. There are a few chairs placed around the table, and a man is seated at the table using the laptop", "mscoco_hallucinated_words": [["keyboard", "keyboard"], ["mouse", "mouse"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "clock", "person", "laptop", "tv"], "hallucination_idxs": [16, 18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.18181818181818182, "Recall": 0.7142857142857143}}, {"image_id": 473118, "caption": "The image showcases a person riding a skateboard while doing tricks on the ramp, highlighting the fun and excitement of skateboarding. The skateboard is positioned on a ramp as the rider is skillfully riding it, demonstrating their abilities and techniques", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "Two people are standing in the snow at the top of a slight hill, wearing skis and holding ski poles. They are positioned next to each other, and a tablet or a sign is placed nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 416104, "caption": "In the image, several people are sitting around tables underneath an umbrella. The people seem to be enjoying the outdoor atmosphere, possibly having a conversation or drinking beverages", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 511852, "caption": " The scene depicts a pair of skiers walking on a snowy slope. There are two men, both wearing skis and with backpacks, facing the camera, and they are hiking up the mountain side by side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 59386, "caption": " The image portrays a group of giraffes gathered around a tree, feeding on leaves. There are four giraffes in the scene, with some standing close to the tree while others are further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "The image depicts an intersection in a city with various streetlights and a green traffic light with a smiley face on it. The intersection is bustling with cars of different types and sizes, both parked and moving around the city", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 153692, "caption": " The image captures a man and his dog riding their bikes across a pedestrian crossing, with multiple traffic lights. The man rides his bike while walking, with the dog riding alongside him on the same bike", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "traffic light", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 265628, "caption": "The image is of a toilet, located near the corner of the room. A man is standing in front of the toilet, with his feet positioned close to the edge, wearing black shoes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toilet", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 499594, "caption": " (Potential question) In the image, a piece of meat is served on a plate with broccoli, accompanied by a bottle of red wine and various sauces on the table. There are also some spices and a fork on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "bottle", "knife", "broccoli", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 5934, "caption": "The image depicts a baseball and a baseball glove in close proximity. The baseball is on the left side, sitting close to the glove, which is on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47828, "caption": " The image portrays a night scene with a blue river and a bridge over it. There are a few boats visible on the river, one being close to the middle of the bridge, and the other boats located near both ends of the bridge", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47916, "caption": "In the image, there is a dog running with a frisbee in its mouth, with two other dogs in the scene. One dog is located towards the right side of the image, while the other dog is in the top left corner", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "car", "truck", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 255483, "caption": "This image shows a person sitting at a table, likely writing or working on some sort of paper. There are multiple papers placed on the table in front of them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "dining table", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 131138, "caption": " The image shows a computer desk with a TV screen, keyboard, and mouse. On the desk, there is also a laptop placed nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "spoon", "mouse", "keyboard", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5555555555555556}}, {"image_id": 258209, "caption": "The image shows a man sitting on a bench near a building, probably in a city or urban area. The man is talking on a cell phone", "mscoco_hallucinated_words": [["cell phone", "cell phone"]], "mscoco_gt_words": ["bicycle", "bench", "book", "person"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 347453, "caption": "In the image, there are several red and white buses driving down the street. One red bus is closer to the front of the scene and one white bus is positioned further back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "bench", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 285820, "caption": "The image shows a well-equipped living room with a couch, desk, and a television, all sitting on a rug. A large TV occupies a significant portion of the room, positioned near the couch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "couch", "book", "bench", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 245664, "caption": "A desk is showcasing a collection of personal belongings and technology, including a computer monitor, a laptop, a keyboard, and various items spread out across the wooden surface. The computer monitor, located at the front of the desk, has a screen displaying images and documents", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "wine glass", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 453731, "caption": "According to the picture, a dog is lying on a wooden table in front of a building. The dog appears to be sleeping and is positioned on the table with its legs stretched out", "mscoco_hallucinated_words": [["table", "dining table"], ["table", "dining table"]], "mscoco_gt_words": ["bottle", "dog", "cup"], "hallucination_idxs": [12, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 524601, "caption": "According to the picture, a group of people, including a woman and a man, are playing a video game together in a large room. They are all actively engaged in the activity, with one woman holding a Wii remote and a man nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "chair", "couch", "book", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 253262, "caption": " The image depicts a small airplane, likely a private jet, parked on a tarmac or airport runway. Two men can be seen in the scene, standing near the front of the aircraft", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 87052, "caption": "The image depicts a small kitchen, possibly in a residence, with a couple standing and sharing the space. The man is standing towards the back of the kitchen, while the woman is to the left, in the front", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "vase", "oven", "bottle", "person", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 357578, "caption": " The scene features a red fire truck parked on the street, partially visible. There are several cars parked on the street, including a white car in front of the fire truck, a white car behind it, and a black car further down the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 418692, "caption": " In the image, a man is sitting on a couch in a living room, holding a cell phone. The couch is positioned towards the left side of the room and the man is sitting slightly to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 259345, "caption": "According to the picture, a man with a beard and mustache is sitting in a chair, holding a large pink umbrella, and wearing a long multi-colored dress. He is the main focus of the scene, occupying the central area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 119709, "caption": "According to the picture, a woman is preparing donuts on a red table, surrounded by various other donuts of different shapes and sizes. The table is full of piled-up donuts, with some of them on the ground", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 443299, "caption": "According to the picture, two people are sitting on a bench in a subway station, both using their cell phones. The main man is checking something on his cell phone while the other man is sitting next to him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 120776, "caption": "In a busy urban environment, a small group of people is sitting on a balcony with a view of the street. Two large umbrellas, one with an artful metal sculpture on it, are on either side of the balcony", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 411765, "caption": "In a tennis court, a man is playing tennis, with a tennis racket in his hand, about to hit a ball. The ball is located in the center of the court, near where the player is swinging the racket", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 447991, "caption": "A woman is standing on the sidewalk next to a van, surrounded by various storefronts, including a business with the name \"Asian Food\" and several other shops. Another person is walking along the sidewalk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bicycle", "handbag", "traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 276719, "caption": " There is a scene with a small dog standing on the sidewalk in front of a blue car and two vintage cars, creating a unique and interesting intersection. The dog is positioned in the middle of the street, with two additional people walking nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "truck", "chair", "handbag", "dog", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 422328, "caption": "In the scene, there is a large snow pile near a horse and a carriage. The horse, likely a horse-drawn carriage, is covered in snow, while the carriage is parked next to it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "horse", "skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 354559, "caption": "The image features a woman in a black dress, standing close to each other. The woman is holding a teddy bear, possibly giving the impression that she's trying to hug it or protect it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "bear", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 438788, "caption": " In the image, there are two pieces of white cake arranged on a dining table. One piece is in the process of being cut, likely by a person holding a knife nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "knife", "person", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 468005, "caption": "The image features a large grey elephant walking down a street or sidewalk with several people around it. Some of the people appear to be interacting with the elephant, while others are watching it from a distance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 545594, "caption": " In the picture, a man wearing a tie-dye shirt is standing on a bus, holding onto a backpack. There are several people around him, with one person standing near the front and two others towards the back of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "orange", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 219546, "caption": "The image features a table laden with various food items. The table is set for a party or celebration, and it contains bowls, dishes, and utensils filled with a variety of food, including meat and cheese", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 386645, "caption": " The scene depicts a rickety building with its roof partially collapsed. A blue truck is parked in front of the building and several people can be seen standing near the truck, with some of them walking past it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 155131, "caption": " The image shows a woman in a white dress standing on a tennis court, leaning forward and preparing to serve a tennis ball. She is the main focus of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "sports ball", "bench", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 188752, "caption": " The image depicts a man standing near two large bunches of bananas hanging from the ceiling at an outdoor market. There are many bananas in the bunches, with some bananas hanging individually and others clustered together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 228350, "caption": " A group of people is sitting outside at a restaurant, enjoying a sunny day underneath a series of red umbrellas, providing shade and comfort. There are multiple tables and chairs set up for the diners, who are dressed in a variety of attire, including jackets, t-shirts, and dresses", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "chair", "tie", "wine glass", "umbrella", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437720, "caption": "According to the image, a naked woman is sitting at a table, looking like she is working on something. The painting depicts a feminine figure sitting on a chair with red chairs in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "chair", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 378831, "caption": "The image depicts a woman walking past a fire hydrant. She is carrying grocery bags and walking towards the right side of the picture, with a person also visible in the background near the fire hydrant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "fire hydrant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375503, "caption": "There is an image of a staircase in a home or building, possibly leading to an upper or lower level. The staircase features several wooden railings and banisters, creating an elegant and decorative style", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "clock", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 330369, "caption": "The scene features a red and white boat in the water at a dock. The boat is large, occupying a significant portion of the image, and has a distinct shape with a mix of red and white colors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 288576, "caption": " According to the picture, there is a man standing next to a small tree stump, throwing a red frisbee near the tree trunk. In the background, a couple of bicycles are visible, with one located near the left side and another on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 32190, "caption": "The image captures a small toy horse, likely a collectible figurine, placed on the sidewalk in front of a street. The street appears to be in a city setting with various cars parked around the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 535403, "caption": " The image features a bathroom with two sinks, one larger and one smaller, located in different areas of the room. The larger sink is on the left side of the image and is accompanied by a mirror above it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "clock", "bottle", "sink", "hair drier", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 449798, "caption": "The image features a home office set-up with various computer items placed on a table. There is a keyboard on the left side and a mouse placed near it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375769, "caption": " The image depicts a young boy sitting at a dining table in a restaurant. He is wearing a helmet and has a hoodie on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bicycle", "chair", "hot dog", "umbrella", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 426172, "caption": " The image depicts a dining area with a table featuring a wine rack and several books. One of the books is a large book about wine placed on top of the table, with its title visible", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 20650, "caption": " The image features a dining table with a couple of items on it. There is a large, orange plate placed on the table that is covered in broccoli and two slices of bread", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "sandwich", "orange", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 138078, "caption": "In the image, there are two young baseball players standing on a field. The first player, wearing a red shirt and white pants, is in the foreground, holding a baseball glove", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 152499, "caption": "According to the picture, a group of people, including some children, are sitting in a pool next to a couple of surfboards, one of which appears to be on top of an air mattress. There is a person wearing a party hat, and another person in a purple shirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "dining table", "potted plant", "chair", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 180764, "caption": " The image depicts a man in the process of eating a pink glazed donut. He is the focal point of the scene, and a number of other people can be seen in the background, with some situated near him and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "microwave", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 147762, "caption": "The image features a plate with a small dessert on it. The dessert is covered with a white substance and has a yellow center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "fork", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 113860, "caption": "The image depicts a sailing boat on the river, moving along the water with some trees in the background. The boat appears to be quite large and is the main focus of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 460866, "caption": "The image features a variety of toothbrushes grouped together inside a cup or sink. Some of the toothbrushes are clustered together in the center, while others are scattered throughout the cup", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "toothbrush", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 177015, "caption": "According to the picture, a man is sitting on a couch, holding a cat and using a laptop. There are a couple of other individuals in the room, with one person occupying a couch nearby and another person seated on a different couch", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "chair", "couch", "person", "apple", "laptop", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 333998, "caption": "The image features a well-equipped kitchen with a refrigerator on one side and a microwave oven on the other. Two ovens are positioned on the counter, one above the refrigerator and the other below", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "microwave", "person", "suitcase", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47131, "caption": "The image depicts a group of men trying to get onto a train that has derailed. The men are scattered around the wreckage, with some trying to climb on top of the train cars", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425447, "caption": "According to the picture, a white truck is driving down the street, appearing to be watering a fire hydrant in the middle of a sidewalk. The fire hydrant is located at the center of the image, surrounded by trees and parked vehicles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295105, "caption": "The image features a man standing in front of a refrigerator in a kitchen. He is looking towards a person outside the frame, likely through a window or door", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "person", "apple", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 443259, "caption": "This is an image of a large open kitchen with a refrigerator and a dining area. The kitchen features a stainless steel refrigerator and a few cabinets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "oven", "chair", "bottle", "sink", "orange", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1111111111111111}}, {"image_id": 537861, "caption": " In the image, there is a yellow and gray train traveling along a train track. The train occupies the middle of the picture, while the left side is occupied by the station platform", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 145020, "caption": "According to the image, there is a large stuffed duck with a yellow vest standing next to a toy car and many other toys in a parade setting. The duck is likely a Disney character like Donald Duck or Mickey Mouse, and there are other toys present in the scene", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["teddy bear", "mouse", "bird", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 249969, "caption": "In the image, a plate of food is set on a table. The meal features multiple kinds of meat, such as chicken and beef, as well as vegetables like broccoli and carrots", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 146504, "caption": " In the image, there is a person sitting at a desk with their hands on a computer keyboard and mouse. The keyboard and mouse are placed on a table in front of the person", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 40037, "caption": "There is a large clock tower with a green roof near a building in a scene. The clock tower is tall and has a large clock on top of it, indicating a building with a clock face on top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 343218, "caption": " In the image, two men can be seen on an outdoor tennis court, playing and enjoying a game of tennis. One of the men is holding a tennis racket, likely in the middle of a match or warm-up, while the other man is positioned nearby, waiting to play", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "car", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 301837, "caption": "The image showcases a long and narrow kitchen with white cabinets. The countertops appear to be made of granite or another similar stone material", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "clock", "sink", "apple", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 309071, "caption": " The image features an older man bending over to remove the wheel of his bicycle from the paved area. He is standing next to a small potted plant and closer to the left side of the picture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "potted plant", "bicycle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 240681, "caption": "In the image, a person is standing next to a red motorcycle on the side of the road. The man is holding a cell phone and appears to be taking a photo of the motorcycle or possibly using it to take a call", "mscoco_hallucinated_words": [["cell phone", "cell phone"]], "mscoco_gt_words": ["backpack", "motorcycle", "car", "person"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 178753, "caption": "The image features a girl with braces smiling and holding a cellphone. She appears to be seated in a chair or a bench in an indoor environment", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 278890, "caption": " The image shows a person holding a cell phone, wearing a blue shirt. The person seems to be in the process of using the phone while it's being placed close to their face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47781, "caption": "There is a room with a large bed and other furniture, including a table located near the bed. The bed is situated at the center of the room, and there are a few drawers underneath it", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["vase", "bed", "book", "person", "tv"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.2}}, {"image_id": 542792, "caption": "According to the picture, a large wooden baseball bat is standing tall, leaning against a building in the foreground. The large bat is a prominent feature of the scene, taking up most of the area around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": " A group of three men, presumably friends, is sitting at a table at a restaurant, enjoying a meal of pizza. The table has two large slices of pizza placed on it, one closer to the camera and another further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 318777, "caption": " The image features a baseball game happening in a stadium surrounded by a large crowd of spectators. There are several baseball players on the field, scattered throughout the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 14773, "caption": " The image features a colorful plate with a hot dog and fries, placed on a table dining. The hot dog is surrounded by the fries, giving the impression that it's a snack or a meal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "hot dog", "bottle", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 521863, "caption": "According to the picture, a young man riding a skateboard is skating through a crowd of people near a library. The skateboarder is skating down the sidewalk, making his way through the busy pedestrian area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 250540, "caption": "In the image, there is a group of four people sitting on motorcycles, one after another. They appear to be in the center of the street, with other motorcycles surrounding them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "motorcycle", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 211604, "caption": " In the image, there is a young woman lying on the floor, possibly due to exhaustion or illness. She is wearing a hat, a black and white shirt, and pants", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 298067, "caption": "The image features a close-up view of meat being served with vegetables and a glass of beer next to it. The meat appears to be chicken or some other kind of poultry dish", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "dining table", "bowl", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 563938, "caption": " The scene depicts two people sitting on a couch, with one person wearing sunglasses and the other wearing a tie. Sitting in front of them is a woman, and a man can be seen to the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "couch", "bottle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 461311, "caption": "The image depicts a crowded outdoor park filled with numerous people of all ages, some with kites in the sky. There are multiple kites in the air, with a clear blue sky as the backdrop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "kite", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 47940, "caption": "In the image, there is a person sitting on a bed, resting their legs on the edge of the bed. The person is holding a book and a mouse, with a computer keyboard visible in the background", "mscoco_hallucinated_words": [["mouse", "mouse"], ["keyboard", "keyboard"]], "mscoco_gt_words": ["person", "laptop", "book", "bed"], "hallucination_idxs": [31, 36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 261318, "caption": " There is a man sitting outside on a bench, talking on a cell phone. He is wearing a grey shirt and a red chair is located behind him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "handbag", "bench", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 134768, "caption": "In a close-up view of a computer desk, a keyboard is visible, sitting near the computer screen. A pair of speakers is also situated on the desk, just to the left of the keyboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["mouse", "laptop", "keyboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 526414, "caption": " The image shows a quaintly decorated sewing room with various household items, including a TV, books, and a computer. The room has a comfortable atmosphere, with a desk and a chair arranged next to a bookshelf", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["scissors", "bowl", "dining table", "cat", "remote", "couch", "book", "laptop", "tv", "cup"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 273132, "caption": "The image shows an old woman, perhaps in her 70s, sitting on a park bench, wearing a hat and with a hand placed near her head. A suitcase is placed next to the woman, likely signifying her traveling or preparing for a trip", "mscoco_hallucinated_words": [["suitcase", "suitcase"]], "mscoco_gt_words": ["handbag", "bench", "person"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": "In the image, a man with a black jacket is taking a bite of a hot dog while laughing. There are multiple hot dogs visible surrounding the man", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "sandwich", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 192656, "caption": " According to the picture, a baseball player is standing on a grass field wearing a baseball glove and throwing the ball. The player is wearing a black and blue jersey and white pants, giving a casual and cool appearance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 272728, "caption": " The image showcases a vase filled with different types of flowers and greens. The vase is prominently placed on a table, creating a nice display", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 509811, "caption": "In a room filled with many wooden tables, a woman is sitting at one of them, surrounded by numerous laptops that are spread out around her. There are at least 15 laptops placed on the tables in various locations, some on the desks themselves and others on the floor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "book", "apple", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 412407, "caption": "The image depicts a person holding an open cell phone up to their right hand. The cell phone is displaying a screen with red bars across the top, indicating the phone is active", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": " The scene features a woman holding a pink polka dot umbrella on a rainy day in an outdoor market. She is standing amidst a group of people gathered at the market, some of whom are holding their umbrellas to stay dry", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "suitcase", "handbag", "umbrella", "person", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441363, "caption": "The image depicts a man playing tennis, in the middle of the tennis court, swinging a racket as he strikes a tennis ball with it. The surrounding area of the court is filled with other people, either watching the game or waiting their turn to play", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 331084, "caption": "The image shows a large, black dining table filled with various ingredients for making pizzas. There are several uncooked pizzas placed on the table, each with toppings such as onions and tomatoes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "spoon", "knife", "person", "pizza", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 282553, "caption": "According to the image, there are two women standing near the road at dusk. One of them appears to be closer to the camera than the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 328818, "caption": "According to the picture, there is a woman in a pink shirt, standing by a bench, adjusting her shoes. There is a bicycle placed behind the bench, partially visible in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bench", "bottle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 3103, "caption": " | According to the picture, the image features a young man wearing a yellow shirt riding a skateboard and performing a trick on a large skate ramp. The skateboarder is in the middle of the trick, leaning into the skate ramp and showing off his skills", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 188136, "caption": "The scene takes place inside a kitchen, featuring various appliances and food on a countertop. The counter is filled with fruit, including apples, oranges, and pears, which are scattered throughout", "mscoco_hallucinated_words": [["apple", "apple"]], "mscoco_gt_words": ["bowl", "dining table", "sink", "orange", "person", "carrot"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.16666666666666666}}, {"image_id": 449675, "caption": "In the image, there is a white plate with a sandwich cut in half on it. A fork and knife are situated near the sandwich, ready for someone to eat it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "bottle", "sandwich", "knife", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 191691, "caption": "The image depicts a man shaving his face in a bathroom. He is standing by the sink, shaving his face in front of a mirror, while another person is standing in the background", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["bottle", "toothbrush", "person"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 89378, "caption": " In the image, a man wearing a red suit is standing near a motorcycle, which is positioned in front of him. The motorcycle is next to a red building with large doors, giving the scene an attention-grabbing appearance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "backpack", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 99874, "caption": " In the image, a woman is sitting at a table while using her cell phone. She is holding her phone close to her ear, and appears to be in a conversation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "cat", "bottle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437895, "caption": "There is an image of a bed with a colorful quilt spread over it. There is a lamp situated next to the bed, adding a touch of light to the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 557447, "caption": "The image features a man in a suit sitting at a desk, looking focused as he points at something on the table in front of him. There are multiple books or binders placed on the table, and one chair is positioned to the left of the desk", "mscoco_hallucinated_words": [["book", "book"], ["chair", "chair"]], "mscoco_gt_words": ["fork", "dining table", "spoon", "tie", "knife", "person"], "hallucination_idxs": [31, 41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.3333333333333333}}, {"image_id": 159979, "caption": "The image shows a large group of people standing around a waterway filled with small boats. There are many umbrellas present in the scene, with one being much larger than the rest and covering a number of the boats", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bowl", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 357, "caption": " A baseball game is in progress, with several players on the field. The baseball player on the left side of the image is holding a baseball bat, getting ready to swing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 538891, "caption": "The image features a woman playing tennis on a sports field. She is holding a tennis racket, prepared to serve the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 561967, "caption": "The image features a train traveling down the train tracks on a sunny day. The engine and cars are spread out across the track, with a blue and yellow train on the right side and several other train cars visible on the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "The image shows a blue passenger train on train tracks traveling along a section of track that extends into a tunnel. The train is moving from left to right, giving the impression of a train entering a tunnel", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 7125, "caption": " According to the picture, a group of people is riding bicycles along a path near a river or body of water. There are five distinct bicycles visible in the image, each with a person riding on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "bottle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 221350, "caption": " In the image, a man is holding his necktie, which has an intricate heart pattern. The tie is a red color, and the man appears to be putting on or adjusting it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "tie", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 280930, "caption": "The image shows a little girl laughing in a kitchen. She is wearing a blue shirt and holding a pan with various food items inside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 151081, "caption": "The image features a large green field with a single tractor in the center. There are two helicopters, one of which is flying above the tractor, while the other is following the tractor along the highway, creating an interesting and peculiar sight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 122232, "caption": "The image features a woman in a yellow raincoat playing tennis on a tennis court. She is holding a tennis racket while standing on the court, with several tennis balls scattered around her", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 134223, "caption": "The image features a plate of food containing a hot dog and french fries. The hot dog is situated at the center of the plate, surrounded by the french fries and various sauces", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "hot dog", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 198163, "caption": "In the image, there is a man sitting at a table, surrounded by several white pans filled with a variety of colors. The pans are arranged on the table and cover most of the space, with some closer to the man and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 3742, "caption": " A vase of a single rose is placed next to a pink bowl filled with apples on a window sill. The apples are arranged neatly in the bowl, giving the appearance of being both fresh and carefully arranged", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "apple", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 217593, "caption": " The image features a young boy in a baseball uniform standing in a dirt area near two trees, likely a sandbox or play area. The boy is holding a baseball glove in his hand, ready to throw the ball during a game", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["baseball bat", "chair", "handbag", "person", "baseball glove"], "hallucination_idxs": [41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 279078, "caption": " The image features a young man standing in front of a refrigerator, holding out an open bottle of beer and showcasing all the different bottles of beer inside the fridge. The bottles are displayed both on the left and right sides of the refrigerator, providing a view of a variety of different brands and types of beer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": " The image features a group of people gathered around a tennis court, likely watching a game or playing themselves. There are several tennis rackets on the court, including two at the far left side, one in the center, and three towards the right side of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "couch", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 477016, "caption": "According to the picture, a young girl wearing a pink shirt is standing in front of a refrigerator that has a fish and other items displayed inside it. A woman, possibly her mother or a family member, is also present, along with other people in the background", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["backpack", "potted plant", "oven", "sink", "handbag", "person"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.16666666666666666}}, {"image_id": 301266, "caption": " In the scene, a group of people is gathered around a large dining table. There are two tables, one is located at the left side of the room and the other one at the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "sink", "book", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 475813, "caption": "The scene features a child, likely between the ages of two and four, standing in a room with their arms outstretched, holding a remote control. The child appears to be playing or engaged in some sort of activity, such as testing the remote", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "remote", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 558784, "caption": "According to the picture, there is a man standing next to a dugout area near a lake. The man is holding a baseball bat, indicating a possible intention to practice or play baseball", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["backpack", "person", "frisbee"], "hallucination_idxs": [24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 308543, "caption": " The image depicts a hand holding two silverware utensils, namely two spoons, with their metallic surface and silver color contrasting the black background. The spoons appear to be in close proximity, perhaps being placed side by side or in the hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "sink", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 359164, "caption": "According to the image, there are two small dogs standing on the grass in the backyard. The dogs seem to be enjoying their time outside, likely exploring their surroundings or chasing each other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "dog", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "The image displays a kitchen with a refrigerator and sink placed in the middle of the space, surrounded by checkers. There is also a stove in the kitchen, as well as a few bottles, including one near the center of the room", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["refrigerator", "clock", "sink", "oven"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 143479, "caption": "According to the picture, a group of people is gathered together outdoors in a backyard setting. An old man is holding a tray with a large number of hot dogs, possibly being shared with others in the group", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 475024, "caption": " The image depicts a vase with a variety of flowers inside. It is placed in front of a mirror, likely a decorative mirror", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 238065, "caption": "According to the image, a person is skateboarding up the side of a ramp, with the skateboard and the person being on the left side. The skateboarder is wearing a blue hat, likely a baseball cap, as they are skillfully riding the skateboard in the skatepark", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "According to the picture, the bathroom contains a toilet and a sink, with a bottle of liquor placed on a shelf near the sink. In the background, there is a sign above the sink pointing towards the bathroom's name", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 322163, "caption": "The image portrays a group of people in a commercial kitchen, preparing various foods and drinks for a meal. The main person in the scene is a man in a chef's apron, standing in the middle of the kitchen, surrounded by others who are also preparing the food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "remote", "oven", "bottle", "person", "pizza", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.1111111111111111}}, {"image_id": 230983, "caption": "According to the picture, it captures a scene of a man on a skateboard performing a trick on a green container, which is partially blocked by another person. The skateboarder is in motion, creating an interesting visual contrast by leaping over the green object in the midst of the city", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["skateboard", "car", "person"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "A kitchen has wooden cabinets, [IDK], [IDK]. The image also shows a stove top and oven in the kitchen, possibly a combination appliance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "refrigerator", "sink", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 53431, "caption": " In the image, there is a man sitting on a ledge next to a building, with a laptop on his lap. He is wearing a vest and two ties", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "laptop", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 441840, "caption": "In the image, there are two people and a young boy in a baseball field. The boy is wielding a baseball bat, while the other two people are present in the scene as well", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "baseball glove", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 53465, "caption": "In the image, there is a cake with the words \"welcome to McDonald's\" written on it, sitting on a plate placed on a dining table. The table is covered with a tablecloth and surrounded by a few chairs, giving the scene a welcoming atmosphere", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.2857142857142857}}, {"image_id": 381031, "caption": "The image depicts a plate of food, consisting of two donuts and a sandwich. The donuts are placed towards the right side of the plate, while the sandwich is located closer to the center", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["sandwich", "sandwich"]], "mscoco_gt_words": ["dining table", "donut", "spoon", "bottle", "microwave", "apple", "cup"], "hallucination_idxs": [14, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.14285714285714285}}, {"image_id": 530520, "caption": " In the image, there are two men sitting on the grass in front of a building. One of them is using a laptop, while the other sits nearby, appearing to be engaged in conversation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "clock", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 539555, "caption": "In the image, there are multiple people of various ages and heights, with some standing or walking around. There is a man actively playing with a frisbee, which is visible in the background, possibly flying through the air", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 279521, "caption": "According to the picture, there are three men standing next to a sidewalk near a train. One person is in front of the group, with two others standing further back, close to the train", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "train", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 560439, "caption": " In the image, three snowshoes can be seen, with two men and one woman wearing them and walking down a snowy hill. The group is in the center of the scene, and their snowshoes can be seen throughout the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "backpack", "skis", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 248353, "caption": " There are several people skiing down a snowy slope, with some standing in line near the path. Among the group of skiers, a man can be seen in the front, wearing a red jacket, while another person is standing slightly behind and to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 9628, "caption": "The image captures an exciting scene on the water where a man is skydiving with a parachute. The man can be seen on the water, wearing a harness, as he leaps through the air with a kite, likely behind him", "mscoco_hallucinated_words": [["kite", "kite"]], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 330050, "caption": "According to the image, a man and a woman are standing on a tennis court, each holding a tennis racket. They are both smiling and appear to be enjoying themselves", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 254161, "caption": " According to the picture, the scene depicts a plaza or public square with a man standing on a red brick surface, looking up at a kite flying high in the sky. The kite flies off in the distance, near a tall building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "kite", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 275749, "caption": "According to the picture, there is a group of people standing and sitting around a table, interacting with one another. There are four people in the scene, with three of them positioned closer to the table while the remaining one is further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "mouse", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 163518, "caption": "In the image, a woman is standing in a kitchen, working on a buffet or table filled with a variety of vegetables. There are numerous vegetable dishes on the table, such as lettuce, tomatoes, and broccoli", "mscoco_hallucinated_words": [["broccoli", "broccoli"]], "mscoco_gt_words": ["bowl", "dining table", "oven", "chair", "person"], "hallucination_idxs": [41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 156696, "caption": "The image is of a train station with a train parked on the right side and a person standing near the left side of the train. The train is located in a building, perhaps a train station, and a person is walking on the left side of the train", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 525202, "caption": " In the image, a large pizza is placed on a metal pizza panner in front of a table. It appears to be a take-out pizza, as it has no visible toppings or cheese, but it has a distinct round shape", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 423984, "caption": " The picture features a plate full of food that appears to be pasta with vegetables, including carrots and broccoli. There are several pieces of carrots spread across the plate, some closer to the edges and others more towards the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 499486, "caption": "According to the picture, there are two cats sitting on a bed. One cat is black and white, while the other cat is grey and white", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": " The image shows a young man sitting in a car wearing glasses and a purple tie. The man is also wearing a shirt, possibly dark-colored, under his button-down shirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 288729, "caption": "The image features a decorated cake with a small elephant inside, placed underneath a large red and yellow tipped tent, which looks like a circus tent. The cake appears to be about two feet high and covers a significant portion of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cake", "bear", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177721, "caption": "According to the picture, a man is performing a trick on a skateboard, with a green shirt and blue jeans visible in the scene. He is balancing on the skateboard as he is skillfully riding it while in motion", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": "According to the picture, there are multiple people standing in different areas of the scene, including two men in the center of the image, and another man standing to the right. A man with a beard, glasses, and a black hat is standing near the other people, looking at something on his cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "cell phone", "horse", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 252625, "caption": "The image depicts a narrow, empty sidewalk street with several people and bicycles, creating a quaint town-like atmosphere. A bicyclist rides down the sidewalk on the left side of the street, while three additional people are on the street in different spots", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 493610, "caption": "The image captures a scene of people sitting on the back of a truck, with a crowd of individuals enjoying a car ride. Some of the people are seated close to each other, while others are dispersed across the truck", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 302789, "caption": "The image shows a room with a small bed and a fridge, possibly in a kitchen or hotel room. The bed is covered with a sheet and has a suitcase placed on top of it, suggesting that someone has just packed their belongings before leaving", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bed", "bottle", "sink", "handbag", "suitcase", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 30667, "caption": " Sitting in the middle of the scene is a large, brown dog. It appears to be comfortably lying down on the floor, with a person sitting nearby, on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 114108, "caption": "The image depicts a dining table with two pizzas placed on it, one with cheese and the other with cheese on it. There are multiple people around the table, and some of them are sitting on chairs while others stand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 328110, "caption": "The image captures a scene with a woman sitting on a bench and holding a baby. Other people are around the woman, with some sitting on a bench or standing nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 366111, "caption": "This is a black and white image showcasing a street scene with several men riding bicycles. In the middle, there is a man in a suit wearing a bow tie while traveling on his bicycle", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 532481, "caption": " The image captures a thrilling moment of a person parasailing in the ocean. There are two kites visible: one on the left side and another on the right, indicating a pair of people enjoying the outdoor activity together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 291634, "caption": " The scene features a row of motorcycles parked on the side of the street, with several bikes of various sizes and colors lined up side by side. Some motorcycles are positioned closer to the viewer, while others are further down the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 463678, "caption": "The image captures a man standing on a tennis court, preparing to swing his racket and hit the tennis ball. The man is wearing white and can be seen in the center of the picture, holding the tennis racket in his hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 70815, "caption": "This image depicts a dog being walked on a leash, which is hanging from a motorcycle or bicycle in the background. The scene is likely a street or sidewalk, as there are multiple other people nearby, some sitting and others standing", "mscoco_hallucinated_words": [["motorcycle", "motorcycle"]], "mscoco_gt_words": ["bicycle", "dog", "person", "truck"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 367872, "caption": " The image captures a baseball game, with a batter swinging at an oncoming ball. The batter is in the middle of the action, while the team members gather around the field to watch the play", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "umbrella", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 353898, "caption": "The image features a man sitting on a stone bench surrounded by a large group of birds. The birds are a mix of doves and pigeons, with a few standing on the ground and many more in the air", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "bench", "person", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 88269, "caption": " The image features a meal consisting of a bowl of soup and a couple of grilled cheese sandwiches. There are three sandwiches, each placed on the plate with different knives, one in the center and two on either side", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["spoon", "bowl", "sandwich"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 463211, "caption": "The image features two little girls wearing backpacks, one on the left and the other on the right, in front of a school bus. The girls appear to be leaving the bus and walking towards the right side of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "There is a large room with two chairs against the wall, one closer and one farther back. The furniture is adorned with decorative elements, and there are three vases in the room filled with flowers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 98979, "caption": "The image showcases a microwave, sitting on top of a kitchen counter, with its oven door slightly open. The microwave features a silver color, and a small button is visible inside the oven's interior, close to the bottom of the door", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "knife", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 244455, "caption": " In the image, two men riding motorcycles are on the street, passing through the city or at a public event. They are both dressed in black and wearing helmets, and are riding on their motorcycles with one wearing a white shirt and the other wearing a black one", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": "The image features a pair of orange scissors, arranged in a diagonal pattern. The scissors appear to be lying on the top of a table or desk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "dining table", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 536154, "caption": "The image features a young boy sitting on a bed, surrounded by a massive collection of stuffed animals. The boy is the main subject in the scene, while the stuffed animals are arranged all around him in various sizes and shapes", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["teddy bear", "cat", "person"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 374061, "caption": "The scene is a black and white photo featuring a cat, which is lying down on a couch. It appears to be sleeping or resting next to several teddy bears", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cat", "bed", "couch", "bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 560018, "caption": " The image captures a group of people enjoying a day out in the water on surfboards. The large crowd, consisting of various individuals, is spread out across the ocean waves, having fun and riding them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 353320, "caption": "In the scene, a guitar case is leaning on a bench, with various pieces of luggage surrounding it. There are five suitcases in total: one is situated close to the guitar case and the bench, while the other four are further back and towards the right side of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 256628, "caption": " The image features a large dog lying on the wooden floor, with its mouth open and tongue out. The dog is positioned on the right side of the scene, with its head and neck occupying a significant portion of the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": " The image captures a scene of a person feeding a cute brown and black dog a sandwich on a blue plate. The person has placed the sandwich on the table and the dog seems excited and eager to eat it", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["sandwich", "person", "dog"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 1.0}}, {"image_id": 424270, "caption": " There is a small child in a white dress sitting on the bed in the image, occupying the center of the scene. The bed looks comfortable, with sheets and blankets covering it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": " In the image, a brown horse is walking in between two cars, seemingly calmly exploring the area. The horse is placed in the middle of the street, surrounded by cars and various other traffic, creating a unique scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 483227, "caption": " The image captures a group of young tennis players wearing purple shirts standing on a tennis court. The players are holding tennis rackets, ready to play or practice", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 228306, "caption": "This is a photo featuring a red bus driving on a street, likely in a city. The bus is parked near several tall buildings, including a building in the front, another in the middle, and another at the back of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 416384, "caption": " The image features a woman sitting on a white, wooden outdoor chair using her cell phone. There are other people in the background, including some near the sidewalk, and some standing at the side of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 364783, "caption": "The image features a red and white bathroom with various bathroom accessories. There is a sink located next to the toilet, and the toilet itself is surrounded by red walls", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "chair", "bottle", "toothbrush", "sink", "toilet", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 335041, "caption": "The image features a person in a red jacket skiing down a snowy street, surrounded by a lot of cars parked along the side. The cars are of different sizes and styles, including some that are at the edge of the street and others that are closer to the middle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 531327, "caption": " The image features a large white bowl filled with a variety of mixed vegetables, including broccoli, carrots, and other colorful, small pieces. The bowl is on a table, surrounded by different dining utensils such as forks, a knife, and a spoon, indicating that it is a meal to be served or enjoyed", "mscoco_hallucinated_words": [["bowl", "bowl"], ["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot"], "hallucination_idxs": [6, 28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.8571428571428571}}, {"image_id": 451228, "caption": "The image depicts a city street at night with numerous streetlights and multiple red double-decker buses traveling down the street. Some of the lights are hung up overhead in a festive display, creating a celebratory mood", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 256365, "caption": " The image depicts a plate covered in white frosting, filled with variously decorated cupcakes. Three cupcakes are present on the plate, one of which features blue frosting, creating an interesting contrast to the white frosting on the others", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 502936, "caption": "The scene features a man playing tennis on a court, holding a tennis racket as he tries to hit a tennis ball. The ball is positioned near the center of the court, and the man is standing in the left side of the court, preparing to strike the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451449, "caption": "According to the picture, a black and white dog is lying in a dog bed surrounded by numerous books, both small and larger ones. The dog bed is in a room, and the books are stacked on various surfaces throughout the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 51054, "caption": "The image features a woman sitting on a bed, holding a cellphone and talking on it. She appears to be an older woman, possibly the subject of a photo blur effect", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bed", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 1268, "caption": "The image depicts a group of people gathering on a bridge over water. A man is standing in the middle, sitting on a bench to look out over the water, while a woman is next to him taking a picture", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["cell phone", "backpack", "boat", "handbag", "person", "bird"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.16666666666666666}}, {"image_id": 62692, "caption": "The image captures a female tennis player swinging her racket during a game, focused on her task. She is positioned at the center of the court and has her back to the camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 542771, "caption": "The image features an old black and white photograph of a room with several chairs and a single table. There is a vase of flowers on the table, adding a decorative touch to the setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant", "chair", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 575406, "caption": "The image depicts a blue and red bus with a large white wing on the side parked on a city street. The bus seems to be a tourist attraction and features a mix of passenger seating and standing areas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 244834, "caption": "In the scene, two people, a man and a woman, are walking along a rainy sidewalk. They both hold colorful umbrellas, with the man carrying one in red, white, and blue and the woman carrying a yellow one", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "bicycle", "clock", "umbrella", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 151159, "caption": " In the image, two men can be seen riding skateboards on a tennis court. One man is wearing a tie, while the other person is dressed in a white shirt and brown pants", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 277073, "caption": "In the scene, two adults are sitting on the back of a moped as they travel down a busy street. One person is a man, the other a woman", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "bicycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 377879, "caption": " The image shows two military tanks on a train. They appear to be large and in good condition", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bed", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 436814, "caption": "The image depicts a small room with various items placed inside it. In the room, there is a laptop sitting on a desk, with a mouse positioned near it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "mouse", "laptop", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 63934, "caption": "A person dressed as a nun is skating down a city street on a skateboard, likely in a parking lot or other public area. The skateboard is located on the sidewalk, with some cars parked alongside the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 275611, "caption": " The image features a whole pizza with cheese and spinach sitting on a plate. The pizza is placed on top of a wood table, which takes up most of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 516248, "caption": " Sitting in front of a computer at night, someone is holding a keyboard and mouse. The keyboard and mouse are plugged into a computer, indicating that the person is using it to communicate or navigate through the internet", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 478380, "caption": " The image shows a man driving a truck down a road, surrounded by a large herd of sheep. There are multiple large flocks of sheep scattered throughout the scene, with some in the front of the truck, while others are further back", "mscoco_hallucinated_words": [["truck", "truck"], ["truck", "truck"]], "mscoco_gt_words": ["sheep", "car", "person"], "hallucination_idxs": [7, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 422326, "caption": " The image features a parking lot filled with various vehicles, including motorcycles, a sidecar, and a pickup truck. Among the motorcycles, there is a sidecar, which stands out in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 110449, "caption": "The image shows two men wearing headphones, each standing near the edge of a table. One man is in the foreground, and the other man is in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 45550, "caption": " The image features a man standing in a restaurant or cafe, smiling as he poses for a photo. He holds a plate with a sandwich, likely French fries and a cup of soda", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["clock", "bowl", "sandwich", "person"], "hallucination_idxs": [33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 444913, "caption": "According to the picture, the scene is of a man standing in a grassy area. He appears to be holding a red Frisbee and throwing it towards a nearby building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 82709, "caption": " The image depicts a black and white dog catching a frisbee in the air, mid-jump, as it leaps over a large group of people. The frisbee is suspended in the air, with the dog in pursuit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "frisbee", "bottle", "dog", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 132796, "caption": " In the image, three people are riding on the backs of two elephants. The first elephant has a man sitting on its back, with another person seated to the right, and a third person seated to the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bench", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 303099, "caption": "In the image, two cats are sitting on a toilet seat. One cat is black and white, while the other is mostly black", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "According to the image, there is a group of motorcycles driving down a street. There are a total of nine motorcycles lined up on the road, some in the front row and others in the middle row", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 205193, "caption": "In the picture, there is an assortment of beverages, with two cups and one bottle positioned on a marble counter. The cups are placed close to each other, while the bottle is located further away to the right", "mscoco_hallucinated_words": [["cup", "cup"], ["bottle", "bottle"], ["cup", "cup"], ["bottle", "bottle"]], "mscoco_gt_words": ["oven", "microwave", "person", "toaster"], "hallucination_idxs": [13, 16, 24, 34], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 272566, "caption": "The image shows a man sitting on the ground near a sidewalk outside a store, surrounded by various types of fruits. In the front of the display, there are numerous bananas, both ripened and green, spread out across multiple bowls", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["banana", "person", "apple", "cup"], "hallucination_idxs": [44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 170099, "caption": " In the image, a man dressed in a suit is standing in front of a couch. He appears to be in the middle of speaking, as he looks towards the camera and gestures with his hands", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "orange", "couch", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 14940, "caption": " The image shows two animals, a cat and a stuffed dog, both laying on a bed or couch, with the cat closer to the front of the scene. The cat is laying on top of the stuffed dog, which has a long snout", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["cat", "chair", "couch", "orange", "dog"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6}}, {"image_id": 408449, "caption": "According to the picture, a man is shirtless and riding a skateboard down the street, likely enjoying his activity. There are multiple people in the background, some closer to the skateboarder and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "handbag", "skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 140702, "caption": " The image features two elephants, one large and one small, walking in the grass. The larger elephant is significantly taller than the smaller one, and they appear to be standing close to each other, possibly even in a playful manner", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 354540, "caption": " The image depicts a kitchen with a person sitting at a tabletop, working on a laptop. There is a microwave oven and a toaster oven in the kitchen, with the laptop placed on top of one of them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "oven", "chair", "person", "toaster", "laptop", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.7142857142857143}}, {"image_id": 19763, "caption": "According to the picture, a slice of deep-fried pizza is sitting on a white plate, which is placed on a dining table in a restaurant. There is another plate visible near the pizza, likely containing another piece of food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 191301, "caption": " The image showcases a dinner table with a tray displaying two desserts \u2013 a cake and a piece of ice cream. The cake is a chocolate one, and the ice cream is a combination of two scoops", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124236, "caption": " The image displays a kitchen area with a dark, narrow opening from a window, revealing sunlight and a few items placed on the countertop. A table sits in the middle of the kitchen space, surrounded by a few pots and pans", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 344930, "caption": "A red fire hydrant sits on the side of the road in the image. The fire hydrant is placed close to a car parked nearby, with a blue top on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "car", "fire hydrant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 14285, "caption": " There is a large, multi-colored cat sitting on a bed in the image. The bedroom setting has a TV in one corner, a couch nearby, and a desk with a computer on it", "mscoco_hallucinated_words": [["couch", "couch"], ["desk", "dining table"], ["computer", "laptop"]], "mscoco_gt_words": ["remote", "cat", "bed", "chair", "book", "tv"], "hallucination_idxs": [26, 31, 34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.5}}, {"image_id": 82488, "caption": " The image features two beds in a hotel room setting, each with a yellow pillow on top. One bed is positioned to the left, and the other bed is located to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "bed", "clock", "book", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 348251, "caption": " The image shows a person skiing down a snow-covered slope. They are wearing skis and holding ski poles, as seen in the surrounding area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 150703, "caption": " The image displays a table with a hot dog served on a tray. The hot dog has tomatoes and pickles, making it an interesting culinary choice", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "dining table", "sandwich", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 381615, "caption": "The image features a window filled with colorful plants and a potted plant, creating a lively and cozy atmosphere. The plants are arranged both around the edges of the window and near the middle, filling the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "chair", "book", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 352703, "caption": " The image shows a woman standing in a kitchen, surrounded by various objects. She is wearing an apron and appears to be in the middle of cooking", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "bottle", "handbag", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 111109, "caption": "The image features a young boy wearing a sweater and shorts, sitting on a chair in the middle of the room. The boy seems to be enjoying his time while posing for the camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "chair", "tie", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": " The image captures a busy street in an Asian city where people are gathered, walking, or sitting, such as on the sidewalks. There are multiple vehicles present, including a large truck and several buses", "mscoco_hallucinated_words": [["truck", "truck"]], "mscoco_gt_words": ["bus", "motorcycle", "car", "person"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 49005, "caption": "There is a baseball game happening on a field, with several players visible around the grassy area. A total of 15 players are spread across the field, participating in the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 410114, "caption": " In this image, a herd of cattle is walking down a dirt road, with a large group of cows and bulls following the lead of a person riding a horse nearby. There are also several other horses along the road, riding along or trailing behind the lead horse and other animals", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "horse", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 100274, "caption": " The image features a train track where multiple train cars are parked, including a flat car. The train cars are spaced out along the track, with the flat car at the center of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 317254, "caption": "The image features a person wearing a mask while riding a motorcycle down the street. The person appears to be in motion, possibly traveling on the motorcycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 425569, "caption": " The image captures an empty, large, restaurant-style kitchen with various appliances and cooking utensils. There are multiple refrigerators and ovens in the space", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["bowl", "sink", "oven"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 28842, "caption": "There is a small park near a grassy area where a few people are hanging out. One person appears to be riding a skateboard, and another person appears to be wearing a blue backpack", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["skateboard", "dog", "person"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 319607, "caption": "The image depicts a street scene with a combination of traffic lights and a bike on the side of the road. On the right side, there are multiple traffic lights, with one red light to the left, followed by a yellow light, another red light to the right, and another yellow light", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 210372, "caption": "The image portrays a small kitchen with red cabinets and a sink. The sink is located towards the middle of the kitchen, positioned underneath a window", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "bottle", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 156915, "caption": "The image showcases a table with a beautiful arrangement of flowers, featuring a red rose in the center and white flowers around it. There are also some greens and filler flowers accompanying the roses, adding a bit of greenery to the overall bouquet", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 349642, "caption": "According to the image, there are two people sitting on a bench while a dog is sitting on the ground in front of them. The dog is positioned in the foreground, while the people are seated further back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": " The image depicts a group of people gathered around a body of water where several boats are docked. The people are standing close to the water's edge, with some of them occupying spots under umbrellas or tents", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "umbrella", "handbag", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 45435, "caption": "According to the picture, a person is holding a cell phone in their hand. The phone is occupying a significant portion of the image, making it the focal point", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": " The image depicts a man sitting at a desk in front of two computers, using one of them. He is sitting in front of a computer, which has a laptop on the desk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 72656, "caption": " In the image, three young boys are sitting at a small table eating. There are two chairs at the table and each child has a plate on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "chair", "person", "pizza", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 372087, "caption": "The scene depicts a green and yellow train traveling along train tracks as it crosses a bridge. The train occupies a substantial portion of the image, with different areas of the train visible", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 336209, "caption": "According to the picture, a man is standing on a skateboard, likely practicing a trick. He appears to be riding on a wooden ledge or a ramp", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 46031, "caption": "The image features a table with a laptop sitting on it. The laptop has a keyboard, mouse, and a monitor, creating a typical setup for a desktop computer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8333333333333334}}, {"image_id": 283118, "caption": "The image captures a family at a dining table with a variety of foods, including a few sandwiches and chicken wings. The father, mother, and their two children appear in the picture, sharing a moment at the dinner table", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["cell phone", "backpack", "dining table", "chair", "bottle", "handbag", "car", "person", "pizza"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.2222222222222222}}, {"image_id": 429598, "caption": "The image shows a kitchen with a brick wall and a small refrigerator located near the sink. A stove top oven can be seen in the foreground", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "bottle", "refrigerator", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 333365, "caption": "Scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 424174, "caption": "The image features a large bowl filled with a variety of fruit, including numerous bananas and apples, placed on a table. The bananas can be found dispersed throughout the bowl, while the apples are situated around the edges", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "banana", "orange", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 3035, "caption": " The image captures an airport scene where two airplanes are parked on a runway. One airplane is positioned at the top right, while the other airplane is situated closer to the bottom center of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 177213, "caption": "The image features a person sitting at a table, eating a pizza with cheese and spinach on it. The pizza is the main focus of the scene, occupying the majority of the table's space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 438535, "caption": "The image captures a city street in black and white, featuring a large clock with a white face and Roman numerals in the center of the photo. The clock, mounted on a large pole, has a dark background, making the numbers more visible", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 490711, "caption": "According to the picture, the image features a white refrigerator standing next to a white cabinet in a kitchen. There is a large sink located on the left side of the refrigerator and a microwave placed on the right side, which could be used for cooking or warming food", "mscoco_hallucinated_words": [["microwave", "microwave"]], "mscoco_gt_words": ["sink", "banana", "refrigerator"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 163728, "caption": " The image features a small black and white kitten sleeping on a table, specifically on a mouse pad, seemingly relaxing after its playtime or nap.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cat", "mouse", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 456756, "caption": " The scene features a tall giraffe standing next to a zebra, both looking towards the right side of the image. There are three other giraffes, one to the left of the tall giraffe and two more located near the center of the image, further back from the camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 281028, "caption": "The image features a train, likely a subway car, with a set of chairs placed in the center of the vehicle. There are two side chairs on the left side of the image, and two more chairs are situated on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 343937, "caption": " In the image, a woman in black snow pants and a white jacket is snowboarding down a snowy hill. She is wearing a helmet for added safety and protection", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 277051, "caption": "Two birds are sitting on top of a table covered with pizza slices and other items. There are two bottles visible in the background, one closer to the left side of the image and the other one on the right side", "mscoco_hallucinated_words": [["pizza", "pizza"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "bird"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 145666, "caption": " The image portrays a large pot filled with a variety of vegetables, primarily broccoli and carrots. The broccoli is situated in different parts of the pot, while the carrots are positioned in the middle of the pot", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "dining table", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 304984, "caption": " The image displays a plate of food, including a sandwich and two small bowls. The sandwich appears to be a French or grilled cheese sandwich, and it's placed on a white plate", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "cake", "sandwich", "wine glass", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 122467, "caption": "According to the picture, a person is holding a white Wii remote, likely playing a video game. In the background, there are two chairs positioned in the left corner, one couch and the other more upright", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["couch", "remote", "dining table", "person"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 518287, "caption": "According to the image, a toothbrush is sticking out of an orange container. This unique object, likely a toothbrush holder or a cup, features a smile on one side and a toothbrush sticking out of the other side", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["orange", "toothbrush", "dining table", "cup"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.75}}, {"image_id": 145448, "caption": "The image features a black cloth covering an area on a table, likely on a patio or a similar outdoor setting, where a small cat is sitting and resting. The cat is curiously watching a man standing closer to the camera than the cat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "dining table", "cat", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 352900, "caption": "The image displays a dish of food on a table, likely containing a combination of pasta and broccoli. It is served on a white plate and appears to be a substantial portion", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["fork", "bowl", "broccoli", "knife"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 153607, "caption": "According to the picture, a blue vase with a flower can be seen in different parts of the image. There is a close-up shot of the vase with a single flower placed in it, and a few other parts of the image reveal the vase with different angles and perspectives", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "bowl", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 157581, "caption": "The image shows a table lined with a variety of bottled wine, giving it a festive appearance. There are 10 different wine bottles of various sizes, colors, and designs arranged across the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 227438, "caption": " The image features a clean, well-made bed in a hotel room. The bed takes up most of the space in the room, and there are a few decorative elements, including a vase situated on a table near the bed", "mscoco_hallucinated_words": [["vase", "vase"], ["table", "dining table"]], "mscoco_gt_words": ["chair", "couch", "clock", "bed"], "hallucination_idxs": [35, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.25}}, {"image_id": 116037, "caption": "The image captures a baseball game scene with multiple people involved. There are three main people in the scene: a batter swinging a baseball bat at a ball during a game, a catcher, and an umpire standing close to the players", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 202658, "caption": " A small toilet, adorned with a Hello Kitty seat cover, is sitting in a room, likely in a basement or storage area. The toilet has a pink seat, which gives it a cute appearance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 18150, "caption": "A man and a young child are sitting on a floor together, surrounded by some chairs, likely in a living room setting. The child is eating a slice of pizza as the man watches, seeming to share the pizza with him", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["backpack", "couch", "bottle", "person", "pizza"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.4}}, {"image_id": 418711, "caption": " The image features a man riding a bicycle down the street, with a large load of bananas strapped to the bike's back. The man appears to be moving from the right to left direction of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 92107, "caption": " The image depicts a green bowl filled with soup, likely containing corn, broccoli, and carrots. The bowl is sitting on top of a placemat or place mat in a dining room setting", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["spoon", "bowl", "broccoli", "dining table"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 491000, "caption": "In a narrow city street, a group of people is walking and enjoying their surroundings. They are spread out along the sidewalk and walking in different directions, some near a building with a sign on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "handbag", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 401163, "caption": "In the image, a man is sitting on a park bench while a dog is laying near him. They appear to be enjoying the park area, with a green park bench serving as the setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 39663, "caption": " The image shows a collection of items, including a backpack, a laptop, and a few books spread out across the floor. The backpack is placed in the center of the scene, while the laptop is located slightly towards the left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "scissors", "backpack", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 268293, "caption": " The image captures a tennis player in motion, swinging a racket to hit a tennis ball during a game. The main subject, wearing a blue and white shirt, is holding a tennis racket and is focused on the approaching ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "The image depicts a small kitchen with various appliances. In the room, there is an oven, a washing machine, and a refrigerator", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["vase", "oven", "spoon", "bottle", "clock", "sink", "apple"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.14285714285714285}}, {"image_id": 358086, "caption": " The image depicts a group of people playing a game of frisbee. There are several people standing or jumping around the field, actively participating in the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bottle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 89541, "caption": " The image features a variety of food in a yellow container, with several pieces of cakes and muffins. Among these items, there are three different kinds of cakes, with one being larger and the other two being smaller", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "cake", "bowl", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 239445, "caption": "The image depicts a man with a white shirt standing in front of a fenced-in area with several people scattered around. He is holding a white frisbee, seemingly contemplating what to do with it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "A giraffe is standing in a large grassy field, appearing to be chasing a kite. The kite flies in the background, adding interest to the scene", "mscoco_hallucinated_words": [["giraffe", "giraffe"]], "mscoco_gt_words": ["cat", "kite", "dog", "car"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.25}}, {"image_id": 487990, "caption": "A person is holding a guitar and placing it in front of a table filled with various food items. The table is surrounded by chairs and other people, creating a fun and festive atmosphere", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "donut", "spoon", "bottle", "cake", "knife", "person", "cup"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.2}}, {"image_id": 138834, "caption": "In the scene, there is a man walking next to a vehicle, possibly a truck or a SUV, wearing snow equipment. He is carrying ski poles in his right hand and skis on his back", "mscoco_hallucinated_words": [["truck", "truck"]], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 492057, "caption": "In the image, a man wearing a black jacket is taking a selfie. He appears to be in a public bathroom, possibly recording a message or a sign on the back wall", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 388215, "caption": "The image shows a man in a blue and white shirt playing tennis, standing on a court and preparing to serve the tennis ball. The man is holding a tennis racket and is getting ready to swing it to hit the ball, which is positioned at a location on the court close to his left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 111409, "caption": "The image features a man riding a motorcycle on a sidewalk. He is wearing a helmet and sitting on the bike while it's stationary", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451391, "caption": "The image captures a person holding a large bouquet of green broccoli flowers, which are arranged in an artistic manner. This arrangement showcases the beauty of broccoli flowers, which are typically used as decorative items or presented as a gift", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["broccoli", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 92462, "caption": "The image features a group of cows walking down a dirt road in front of a car. There are six cows visible in the scene, with two of them in the middle and the others trailing behind, creating a long line of cows", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "car", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 397268, "caption": "According to the picture, a store window displays two bicycles side by side, one leaning against the other. The bicycles are placed in front of the window, outside the shop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "chair", "bench", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 127659, "caption": " The image features a large passenger train pulling along the railroad tracks, which is the main focus of the scene. There are a few people waiting at a train station, some sitting on the benches that are placed throughout the platform, and others walking around the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 251857, "caption": "The image captures a group of skateboarders in a city plaza. Two men are skateboarding, with one skateboarding right in front of the camera, and the other one further back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 243212, "caption": "According to the picture, a young boy in a green shirt is standing in a field while holding a blue frisbee. The boy is the main focus of the image as he is the only person present in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "car", "truck", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 444304, "caption": "The scene shows a person sitting on a bed, crouching down with their back to the wall. They appear to be playing a video game on a TV, possibly on a stand next to them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "remote", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 305000, "caption": " In the image, there is a market stand in the background with two women shopping for produce. An older woman is standing near a table full of vegetables, with several baskets and an empty cup nearby", "mscoco_hallucinated_words": [["table", "dining table"], ["cup", "cup"]], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [26, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "Two men dressed in tuxedos are seated at a table in a social setting. One of the men is holding a glass bottle, possibly a wine bottle, while the other person has a bottle in their hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tie", "bottle", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 154846, "caption": "The image features a large pan of pizza covered in pepperoni and mushrooms. Several slices of the pizza can be seen throughout the dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 567254, "caption": " The image features a small child with blonde hair in the center of the scene, sitting in front of a television. The child appears to be playing with a pink toothbrush held in her right hand, possibly brushing her teeth", "mscoco_hallucinated_words": [["toothbrush", "toothbrush"]], "mscoco_gt_words": ["person", "bottle", "tv", "vase"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 79261, "caption": " According to the picture, a man is standing in a body of water, mopping the area with a broom. The water appears to be located in front of a building and is surrounded by various people in different areas of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301402, "caption": "The image depicts a man wearing a hat, sitting on a chair and looking at his laptop. He is positioned at the center of the scene, focusing on his laptop, which is placed on a table nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "chair", "bottle", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 415828, "caption": "The scene takes place on a street where a man and a woman are standing outside of a building. They appear to be waiting for a bus or a ride, as they are accompanied by a few other people nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "stop sign", "umbrella", "handbag", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 543231, "caption": " In the image, a woman is taking a picture with a camera. She is holding a remote control in one hand while standing next to a couch, and there is another person in the background", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["remote", "bowl", "bed", "book", "person"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 495357, "caption": " In the scene, a small motorcycle is traveling down the street with a person riding it. There are several people on the street, including a few men and a woman, who are interacting with each other or focusing on other aspects of the street scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 523175, "caption": " The image displays a bowl filled with soup on a countertop or table. The soup has many vegetables, including oranges, carrots, and onions", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["spoon", "bowl", "carrot", "dining table"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 184945, "caption": "The image depicts a row of motorcycles parked on the side of a road. The motorcycles are positioned close to each other, creating a line", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 49942, "caption": " The image features a man holding an umbrella with a pink and white striped shirt. The man is facing forward, and the umbrella covers much of his face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 223019, "caption": "The image features a blue train, likely a commuter train, sitting on the train tracks, with a person standing on the right side of the train and several people on the left side of the train. There are also a couple of handbags on the platform, one closer to the left side of the train and the other closer to the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "train", "handbag", "car", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 42889, "caption": "In the image, there is a teddy bear sitting on a table in front of a computer, with a keyboard and a mouse nearby. The keyboard is placed slightly behind the teddy bear, while the mouse is positioned to the right of it", "mscoco_hallucinated_words": [["table", "dining table"], ["computer", "laptop"], ["mouse", "mouse"], ["mouse", "mouse"]], "mscoco_gt_words": ["teddy bear", "bear", "keyboard"], "hallucination_idxs": [12, 17, 24, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 22112, "caption": "In the image, there are a few interesting objects on display. Among the items, a large, blue vase with greenery inside is prominently positioned in the center of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 247587, "caption": "In the image, there is a beach scene with a man riding a surfboard on the sand. The man appears to be standing on the surfboard as he walks along the beach", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": " There is a large city bus with bicycles attached to the front of it. The bicycles can be seen on the right side of the bus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 545056, "caption": " The scene takes place in a large, grassy field where a herd of cows is grazing. There are many cows scattered throughout the field, with some closer to the front of the image and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "dog", "car", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 401411, "caption": " In the image, there is a man standing in a kitchen, surrounded by other people. There are three people sitting across from the man, with one person slightly to his left, another slightly to his right, and the third one right behind him", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "book", "person", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 2867, "caption": " The image portrays a group of people standing outside in the snow, ready to go skiing. All the individuals have skis on their backs and some are holding backpacks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 246963, "caption": "According to the picture, it depicts a group of motorcyclists riding down the road. They appear to be traveling in a single lane on the right side of the road, with a stop sign and traffic sign nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 498225, "caption": "In the picture, there are three people standing in front of a glass door, likely to be a display window of a bakery. They appear to be admiring the various cakes and pastries visible in the shop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "donut", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124601, "caption": " In the image, there is a kitchen with various appliances and a laptop on a counter. The kitchen has a wooden surface with cabinets against the wall, along with two cupboards with bottles of drinks placed inside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "keyboard", "sink", "wine glass", "microwave", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 581749, "caption": " The image displays a variety of different types of vegetables and fruits. Among the produce, there are several bunches of broccoli, which are placed together in two separate containers, with some broccoli scattered on the table as well", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["orange", "broccoli", "dining table"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 227960, "caption": " The image displays a dining table with a white dish containing various food items, including carrots and at least one bowl of broccoli with sauce. A spoon can be seen next to the white dish, indicating the presence of sauce within the food itself", "mscoco_hallucinated_words": [["table", "dining table"], ["broccoli", "broccoli"]], "mscoco_gt_words": ["bowl", "spoon", "wine glass", "carrot", "cup"], "hallucination_idxs": [5, 23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6}}, {"image_id": 286503, "caption": "The image depicts an elephant standing near an artificial structure, likely a tall support or a bench, in a fenced enclosure. The elephant appears to be engaging in its feeding activity, as it is surrounded by a group of people, likely visitors or staff members at a zoo", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["elephant", "person", "sports ball"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 315740, "caption": "The image depicts a clean and nicely organized kitchen with a sink and a countertop. There is a living room in the same space or nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "potted plant", "oven", "chair", "couch", "sink", "tv", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 142108, "caption": "In the image, a group of people with bandannas covering their eyes are gathered around a dining table with multiple bananas placed on it. The bananas are scattered across the table and several hands are visible, likely belonging to the blindfolded individuals attempting to peel the bananas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542933, "caption": " This image captures a baseball game in action. There are several people standing around the field, including the baseball player who has just hit an inside ball during a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "chair", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 475043, "caption": "The scene is set in a living room, with a woman sitting on a couch in the center and a man sitting on another couch nearby. The woman has a laptop and a cup on a table, while the man has two beers and a cup", "mscoco_hallucinated_words": [["cup", "cup"], ["table", "dining table"], ["cup", "cup"]], "mscoco_gt_words": ["bowl", "spoon", "couch", "bottle", "person", "laptop"], "hallucination_idxs": [35, 38, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3, "Recall": 0.5}}, {"image_id": 456784, "caption": " The image captures a person cutting a cake with a large knife. The cake, which has a white, round shape, is positioned on a table", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["cake", "knife", "person"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 33753, "caption": "According to the picture, there is a wooden park bench in the scene, which has a remote control sitting on top of it. The remote control is positioned in the center of the bench", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "remote", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 448694, "caption": " A group of young men, most likely friends, are playing a game of frisbee outside in a field. They are engaged in the activity, with some of them trying to catch the frisbee, while others focus on the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": "The image features a bowl of food on a table, likely dining or dining table. The bowl contains a mixture of noodles and vegetables such as broccoli", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "broccoli", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 503210, "caption": "According to the picture, a spacious room with a piano and two couches has been converted into a living area by removing the piano and adding chairs. A large couch is situated on the left side of the room, and two smaller couches are placed on the right side, with one couch closer to the middle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "chair", "couch", "clock", "book", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 142257, "caption": "A busy street with a traffic light is the setting of this scene. There are several cars, some more prominent than others, going about their business", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}], "overall_metrics": {"CHAIRs": 0.1843687374749499, "CHAIRi": 0.06819421713038734, "Recall": 0.47308394160583944, "num_hallucinated_caps": 92.0, "num_caps": 499.0, "hallucinated_word_count": 125.0, "coco_word_count": 1833.0, "length_response": 39.68336673346693, "hallucinated_caps_ls": [324008, 39053, 128119, 401027, 317320, 161227, 32625, 18688, 67833, 254368, 231534, 209347, 13550, 300784, 344942, 300124, 12669, 133146, 261097, 185327, 348654, 268854, 495513, 506401, 183571, 325836, 352734, 401010, 313928, 59710, 229659, 258209, 453731, 145020, 240681, 178753, 47781, 47940, 526414, 273132, 188136, 191691, 557447, 217593, 477016, 558784, 539951, 230983, 53465, 381031, 9628, 163518, 366111, 70815, 88269, 536154, 158806, 531327, 1268, 151159, 478380, 45550, 205193, 272566, 14940, 14285, 226802, 425569, 28842, 283118, 490711, 277051, 122467, 518287, 352900, 227438, 18150, 92107, 474499, 105782, 487990, 138834, 305000, 567254, 543231, 523175, 42889, 581749, 227960, 286503, 475043, 456784]}}}