{"overall_metrics": {"CHAIRs": 0.12525252525252525, "CHAIRi": 0.06157270029673591, "Recall": 0.41950321987120515, "num_hallucinated_caps": 62.0, "num_caps": 495.0, "hallucinated_word_count": 83.0, "coco_word_count": 1348.0, "length_response": 30.272727272727273, "hallucinated_caps_ls": [144305, 493862, 401027, 343534, 209347, 12375, 2154, 104326, 233888, 183766, 169169, 344942, 185327, 401010, 313928, 388237, 122602, 265628, 5934, 347453, 259345, 443259, 537861, 240681, 178753, 250540, 526414, 331084, 328818, 188136, 151081, 477016, 558784, 230983, 381031, 118124, 328110, 88269, 98979, 379443, 560018, 531327, 110449, 45550, 14940, 354540, 191301, 14285, 352703, 317254, 35827, 72656, 163728, 277051, 352900, 227438, 474499, 42889, 124601, 227960, 99053, 503210]}, "results": {"sentences": [{"image_id": 144305, "caption": "There are a few computer devices displayed in the image. A laptop, microphone, and keyboard are placed on top of a laptop with a television set nearby", "mscoco_hallucinated_words": [["television", "tv"]], "mscoco_gt_words": ["laptop", "keyboard", "dining table"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 164091, "caption": "In a scene involving two dolls and a baby, one doll is seated in a baby carriage, while the other dolls are positioned on a bed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 308003, "caption": "The image captures a large wooden park bench with weathered paint peeling off, situated on the sidewalk near a dirt field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": "According to the image, the scene is a plate with a sandwich and salad. The sandwich, likely a hamburger or cheeseburger, is on the right side of the plate, and the salad is placed on the left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 95908, "caption": "The image features a mouse pad, keyboard, and two computer mice on a desk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 329614, "caption": "There is a large street in the image with a yellow church-style building on the left side and a car parked in front of the building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 324008, "caption": "The image displays a tray filled with a variety of food items, including bananas and yogurt. The bananas are spread throughout the tray, with some closer to the edge and others towards the middle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "banana", "train", "orange", "airplane", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 52700, "caption": " In the image, there is a long dining table filled with various types of cakes and cupcakes arranged in lines and placed neatly on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 501311, "caption": "The image captures a baseball game happening on a field. A man in a baseball uniform is on the pitcher's mound, holding a baseball as he is pitching", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 247179, "caption": " There are two elephants in the scene, with people standing and sitting on them as well as in between. The people are wearing different types of clothing, including a few with white attire and a few with black attire", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "elephant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 577912, "caption": "According to the image, there is a small, beige-colored bathroom with a tub sitting in the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toothbrush", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 196341, "caption": "In the image, there is a large clock located inside the building, with people walking around the clock near its location", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 234433, "caption": "The scene features an old street sign left right turn with an arrow pointing up and only painted in black", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 455610, "caption": "The image showcases a red motorcycle parked outside a building, possibly in a parking lot or a parking spot. There are two people standing near the motorcycle; one person is closer to the motorcycle and another is a bit further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": " There is a table in the image with several pieces of food on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "spoon", "cake", "apple", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 493862, "caption": " The image features a man in a grassy field standing with a tennis racket in his hand. He is holding the racket while standing in a position that suggests he is waiting for an opportunity to hit a ball", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["tennis racket", "dog", "person"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 269873, "caption": " The image captures a busy sidewalk scene where a large group of people are standing and watching a trolley go by", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 524656, "caption": "The image features a small, well-organized kitchen with wooden cabinets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "spoon", "bottle", "sink", "wine glass", "knife", "microwave", "toaster", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 369547, "caption": " The image features a beach scene, with a dog and a bird sharing the same space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "bird", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 181446, "caption": " The image depicts a man reaching into an open refrigerator while standing inside a kitchen. The man is leaning in from the left side of the scene, peering into the refrigerator to get something", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "bottle", "sink", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 128119, "caption": "A large, white city bus is making its way down a street in front of an intersection, with a parking lane on the right side of the bus. There are two bicycles placed prominently on the front of the bus, one near the left side of the bus and the other closer to the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "bus", "bicycle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 401027, "caption": "The image features a plate on a table with a sandwich cut in half and a bowl of sauce in front of it. The sandwich appears to be made with bread, cheese, and tomato slices, which makes it a typical sandwich", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "sandwich", "knife", "cup"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 253630, "caption": "The image showcases a living room with a coffee table located to the left, next to the wall. The coffee table is rectangular in shape and has a glass top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 326021, "caption": "According to the picture, a woman is sitting at a dining table with a teddy bear", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": "There are a group of people riding bicycles in the middle of a street. The bicycles are going in different directions, with one going right, another going left, and a third one going further left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": " The image captures a surfer riding a wave on a surfboard, likely enjoying the sport in a body of water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "cat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 161227, "caption": "In the image, there is a black leather chair occupied by a yellow and white pillow with a decorative pattern, and a laptop sitting on top of the pillow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "keyboard", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 25812, "caption": "The image captures a person in ski gear, snowboarding down a hill. They appear to be wearing a white hat and a jacket, and are likely enjoying the snowy landscape", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267537, "caption": " The image shows a group of women sitting together on a bench, possibly at a park or outside, while holding umbrellas to protect themselves from the weather", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "umbrella", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 195645, "caption": " A gathering of people, including a baby, is standing around a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "wine glass", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 155671, "caption": "According to the picture, a small car is traveling down a city street with several traffic lights. A second car is also present on the street, sitting at a red traffic light further down the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 412894, "caption": " The scene takes place in front of a building with several people standing and walking near it, forming a large group", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 32625, "caption": "The image features a table filled with various food items, including two main dishes, cereal, soup, and two cups of beverage. On the table, you can see a white plate with two pieces of food, one containing a fork, and a bowl filled with soup", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "book", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 18688, "caption": "The image captures a baseball game in progress, with a focus on the players on the field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 343534, "caption": "According to the image, there is a small girl doll, dressed in a pink outfit, standing next to two stuffed bears, one brown and one black. The doll is holding a pink hat", "mscoco_hallucinated_words": [["girl", "person"], ["bear", "bear"]], "mscoco_gt_words": ["teddy bear", "potted plant", "chair", "book", "dog"], "hallucination_idxs": [9, 23], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 370657, "caption": "In the image, there is a group of people riding on the back of motorcycles, with a total of six people visible", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "In the image, a man wearing a baseball cap is standing at a sports stadium, surrounded by numerous people in various spots throughout the crowd. The man is holding a couple of hot dogs in one hand, with one hand in his pocket", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460347, "caption": "The image depicts a long street with a city bus in the middle, traveling down two lanes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 398753, "caption": "The scene is a busy baseball field where a baseball game is in progress. Several people are scattered across the field, with some standing closer to the batter and others farther away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 67833, "caption": "The image features a dinner table with a couple of pizzas on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "bottle", "knife", "wine glass", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 272880, "caption": " The image features a plate filled with a delicious slice of pizza placed on the side, awaiting someone to enjoy it. There is a sign on top of the pizza, with the word \"mystic\" written on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 254368, "caption": "According to the picture, there is a man sitting in a bed eating a piece of food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 193108, "caption": "According to the picture, there are two baseball players in the scene, both wearing baseball helmets, and they are preparing to play a game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 459141, "caption": "According to the image, a person wearing a straw hat is riding a bicycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 231534, "caption": "There are several trucks lined up in front of an airplane on an airport runway, including a truck in the foreground and three more trucks further back. Some of the trucks appear to be moving and unloading while others are stationary", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 227031, "caption": "In the image, a man and a woman are standing in front of a white cake, presumably being cut into for a party or celebration. They appear to be getting close to each other, likely to get a better view or position for the event. Another person is visible in the background, possibly waiting in line to get close to the cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "tie", "cake", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 209347, "caption": " The image depicts a woman sitting on a park bench, surrounded by potted plants", "mscoco_hallucinated_words": [["bench", "bench"], ["potted plant", "potted plant"]], "mscoco_gt_words": ["cell phone", "train", "tie", "handbag", "person"], "hallucination_idxs": [9, 13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.2}}, {"image_id": 523292, "caption": " The scene features a cat sitting on top of a table, positioned in the middle, close to a laptop that is open on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cat", "chair", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 12375, "caption": " The image features a plate filled with a variety of foods, including meat, potatoes, carrots, and other vegetables. The meat appears to be either chicken or turkey, while the potatoes are either mashed or boiled", "mscoco_hallucinated_words": [["turkey", "bird"]], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 13550, "caption": " The image depicts a woman standing on a rock, near a body of water, and feeding an elephant. The elephant is the focal point of the scene, with several others present in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 146837, "caption": "In the image, a young man is shown skateboarding, likely practicing or perfecting a trick. He is performing a trick on a rail, with the skateboard close to the top edge, while also balancing on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 67042, "caption": "According to the picture, a man in a white shirt is standing in a building, possibly an archway. He is looking at his cell phone, checking it while standing in this location", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 209925, "caption": "According to the picture, a baseball player is getting ready to throw a baseball in the outfield", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 2154, "caption": "In the scene, a shopping cart is sitting outside a large parking area with many cars parked. The parking area is adjacent to the street, and there are several dining tables scattered in different places", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bench", "car", "person", "umbrella"], "hallucination_idxs": [33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 274931, "caption": " The image features a black and white view of a side street, with multiple cars parked on it. The cars are parked in a row, and some of them appear to be older models", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 104326, "caption": "According to the image, there is a long green-colored kitchen located in the middle of a room. A wooden dining table stands near the kitchen area, with two long benches placed at the sides", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["dining table", "potted plant", "oven", "chair", "clock", "sink", "knife", "microwave"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.125}}, {"image_id": 233888, "caption": " According to the picture, a little boy is playing baseball in a room while a baseball game is on television. The boy is holding a bat and the ball is in the room as well, just in front of the TV", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["potted plant", "baseball bat", "person", "baseball glove", "tv"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 213905, "caption": "The image features two women standing on a tennis court together, both holding tennis rackets in each hand, as they seem to be discussing something together. There are various people in the background, some seated and others standing in different parts of the court, likely engaged in different activities or watching the tennis players", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "backpack", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 277479, "caption": " The image features a toddler, a baby and an open refrigerator", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 300784, "caption": " The image portrays a group of young children sitting together in a sitting area or on a couch, surrounded by a bunch of stuffed animals, possibly a collection or a museum display. The children are sitting close to one another, looking at the animals and enjoying their time together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 183766, "caption": " The image features a dish with cherries and wine glasses on a dining table. The dish, possibly a dessert, is surrounded by small plates holding cake and macarons", "mscoco_hallucinated_words": [["wine glass", "wine glass"]], "mscoco_gt_words": ["fork", "cake", "knife", "dining table"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 169169, "caption": " In the scene, there is a long, blue bench with pillows sitting near a building", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["traffic light", "potted plant", "car", "person"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 409346, "caption": " In the image, there are two women standing near a table with a variety of foods and desserts displayed. They are possibly sharing a meal or event together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 522262, "caption": "In the image, there are numerous bikes parked on the sidewalk next to a railing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "The image captures a man's reflection in a glass window, with a yellow object placed in front of his face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 344942, "caption": "A person is sitting at a computer with a laptop placed on a table. On the screen, a brown box is visible on the top part, possibly representing the profile picture of someone on a social networking site", "mscoco_hallucinated_words": [["person", "person"], ["table", "dining table"]], "mscoco_gt_words": ["clock", "laptop", "tv"], "hallucination_idxs": [1, 13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 275929, "caption": " The image features several white toilets sitting on the front steps of a building, which is covered with a staircase", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": " According to the picture, a group of people is standing outside under umbrellas. Some of the people are holding umbrellas, while others are not", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 300124, "caption": "The image features a large chair with a broken frame and a small microwave sitting on top of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "couch", "dining table", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 46919, "caption": "According to the image, there is a man snowshoeing down a snowy slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 434022, "caption": "A large train is traveling down a long train track, passing over a small river near the coast. The train is filled with an abundance of people onboard, with some gathered at the front of the train, and others spread throughout its length", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 490491, "caption": "According to the picture, there is a street with a brick wall in the middle of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 175878, "caption": "According to the picture, a group of four people are standing near each other in a building. They are holding or holding a cell phone, and one of them appears to be taking a picture with their cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 12669, "caption": "According to the image, a group of people is standing inside a building or room, with one of them holding a glass of wine", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "vase", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 192496, "caption": " In the image, two train cars can be seen, one behind the other, as they are traveling through a city", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 133146, "caption": "The image presents a room with a large collection of furniture in a well-organized manner", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "chair", "couch", "book", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 53744, "caption": "The image features various food items on a cutting board, including several slices of tomato and lettuce. These vegetables appear to be cut into different pieces, creating a colorful and appetizing scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "dining table", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 375902, "caption": "In this image, there is a person wearing skis who has just crossed the finish line, possibly completing a skiing event", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498747, "caption": " In the image, a man wearing a sweater is holding a cell phone up to his ear, while the people in the background are focused on something else", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bottle", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 52435, "caption": "A large group of people is at the beach, with several people surfing in the water. There are many people on the beach, ranging from a few in the background to a handful closer to the water's edge", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "bird", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301977, "caption": " The image features a cow walking across a road near a store, likely a market or shop, in the middle of a busy street. There are a few bottles located around the cow, some closer to it and others farther away, including ones that resemble sodas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 261097, "caption": " The scene takes place on a tennis court with a group of people, including a man holding a tennis racket, walking or standing around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227204, "caption": " In the image, three women of Asian descent are sitting around a dining table, enjoying a meal together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "banana", "spoon", "bottle", "knife", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 353981, "caption": "There is an image of an airplane on a runway in the image. The airplane appears to be a large plane with multiple air tanks attached to it, likely used to transport and store various substances such as fuel, oil, or weapons", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 185327, "caption": "In the image, there is a car driving down a city street, surrounded by a herd of walking elephants. The elephants are in a line, with some walking closer to the car and others farther away", "mscoco_hallucinated_words": [["elephant", "elephant"], ["elephant", "elephant"]], "mscoco_gt_words": ["bus", "horse", "car", "person", "cow"], "hallucination_idxs": [20, 23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 348654, "caption": "In the image, there is a cell phone sitting in a holder on a wooden desk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "laptop", "tv", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 482432, "caption": "The image is a close-up view of a bathroom sink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toothbrush", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 454161, "caption": " The image features a piece of pizza placed on a plate, which is the main focus of the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "fork", "dining table", "wine glass"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 144723, "caption": "The image depicts a dog leaping into the air with a frisbee in its mouth as it tries to catch the disc. The dog is mid-jump, and its head and front paws are close to the frisbee, while its back legs are further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "dog", "frisbee", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "A person is holding a cell phone in their hand, showing the front side of the phone. The cell phone has multiple buttons, including buttons on the front and back of the device", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 379842, "caption": "A picture of a book on top of a table is displaying two video games, a Wii game and a Nintendo 3DS game titled \"super mario bros. wii\". The Wii game is positioned slightly above the 3DS game and both are side by side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 203110, "caption": "The scene takes place on a street with several people walking around and a train car traveling down the tracks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "train", "orange", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 556478, "caption": "The image features two vegetarian pizzas placed side by side on a stove top. They are cooked on pans, with one pan located further right and the other one on the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "oven", "bottle", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 103815, "caption": "The image features a baseball game in progress. There are multiple players on the field, and two baseball players are visible, one pitching and the other swinging at the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 451943, "caption": "According to the picture, the scene is a bedroom with a double bed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "dining table", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 268854, "caption": " The scene features a group of people standing around on a sandy beach near a body of water, with several boats in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "boat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 34464, "caption": "The image depicts a beach scene where a red surfboard is partially submerged in the ocean water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 495513, "caption": "According to the picture, there are two main people in the scene: a man and a woman standing next to each other. The couple is wearing coats and holding up hot dogs on sticks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 529256, "caption": "According to the picture, there are two dogs lying on a bed. One dog is situated near the left side of the bed, covering most of it, while the other dog lies on the right side of the bed, occupying a smaller area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "The image shows a cat sitting on top of a television in a room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "potted plant", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 506401, "caption": "According to the picture, it is a sunny day as various street lights, including a traffic light, illuminate a small intersection in a city setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 406611, "caption": " The image features a group of people gathered around a ski slope on a sunny day. Most of the crowd is standing, with people of all ages and sizes, including children and adults", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "In the image, there are several vehicles and people gathered around them, creating a scene of a transport truck and a few smaller vehicles. The truck, with large satellite dishes mounted on its sides, dominates the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "car", "person", "truck", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 278365, "caption": "According to the picture, there is a man and a woman sitting at a dining table eating pizza in the evening", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 69757, "caption": "According to the picture, the scene features a group of people gathered around a dining table. One person in particular, a woman, is wearing a striped shirt and seems to be the center of attention as she cuts a cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "cake", "knife", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 432213, "caption": " The image features a plate filled with a variety of food items, including a sandwich and French fries. The sandwich appears to be a breakfast sandwich, with an egg and a variety of ingredients", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "sandwich", "wine glass", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 368367, "caption": "In a scene featuring several people, a woman is smiling as she talks on a cell phone, holding it up to her ear", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "A dirt road has been constructed on the beach to support the new highway bridge, creating a significant construction site for the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 92131, "caption": " The image features a green bus with people outside waiting for it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": " The image depicts a young woman lying down on the floor, propping herself up with her head resting on a large suitcase", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565148, "caption": "This scene takes place in a baseball game, as a batter stands at home plate, ready to hit. A catcher is also present, waiting for the ball to be thrown", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 160183, "caption": " The image features a fire truck parked near a small building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 555456, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 235595, "caption": " The scene features several parked motorcycles lined up in a row along the sidewalk on the right side of the street. They are next to a couple of cars, one located in front of the parked motorcycles and another farther back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "potted plant", "car", "parking meter", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 489909, "caption": " The image features a basket filled with various types of vegetables and fruits, including tomatoes, oranges, bananas, and cucumbers. The oranges are located in the center of the basket, with a few of them spread throughout the space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "orange", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 501080, "caption": " The image features a potted flower arrangement sitting on a table. It consists of pink flowers, which are located towards the top and middle of the arrangement", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 405183, "caption": "The scene is a living room where a group of people are gathered around a TV. A man is standing next to a woman, holding a remote control, and he is enjoying a Wii video game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "potted plant", "chair", "couch", "book", "handbag", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 409138, "caption": "The image captures a large white bus driving down a road past buildings, likely in a city environment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 411840, "caption": "The image depicts a tennis court with a group of tennis players walking on the court. There are two main players, both women, walking on the left side of the court", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 333712, "caption": " In the image, there's a piece of pizza that is covered in toppings. The pizza has several slices cut into it, and some appear to be on a plate or dish", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "spoon", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 148977, "caption": " In the image, a teddy bear is sitting on a table, wearing headphones. The teddy bear seems to be enjoying the music or audio it's listening to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "dining table", "bottle", "bear", "keyboard", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 399058, "caption": " In the image, there are two trucks driving on the road, one behind the other, with an elephant standing in the middle of the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "orange", "person", "truck", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 183571, "caption": " According to the picture, there is a man standing on a red boat while a dog is located next to him on the left side of the boat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 325836, "caption": " There is a display of multiple motorcycles on exhibition at a gathering, likely a trade show or expo. These custom-painted motorcycles are parked and displayed on a red carpet, showcasing the custom paint designs and decorations", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 437910, "caption": "The image depicts a small bathroom with a sink and toilet", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 155885, "caption": "The image shows a black and white photo of a bay with boats in it. There are multiple boats of different sizes scattered around the bay", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 467887, "caption": "The image depicts a man sitting at a dining table in his home, using a laptop computer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "couch", "mouse", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 174402, "caption": " The image shows a man standing on a tennis court holding a tennis racket in his right hand. He appears to be concentrating on the incoming tennis ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 352734, "caption": " The image depicts a little boy, seated at a dining table, eating a piece of chocolate cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "cake", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 346716, "caption": " There is a city street scene with two red double-decker buses driving down the road next to each other. The buses are moving in opposite directions, creating a unique sight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 451144, "caption": " In this snowy outdoor scene, a pair of snowboarders is standing on a snow-covered slope", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 295656, "caption": " According to the picture, there are three people in the scene, one of them is a man and the other two are women. They appear to be dressed up, perhaps for a special event or gathering", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "tie", "clock", "car", "person", "pizza", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 129886, "caption": "In the image, there are several people standing on the snowy slope in skiing attire. Two main ski lifts are visible, one near the left side of the image and the other near the center of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557998, "caption": "According to the picture, a woman is sitting at a table with bottles on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 401010, "caption": "The image features a room with a large, neatly made bed and two windows. The bed is situated in the center of the room and is surrounded by various items, including a bottle, a clock, a cup, and a television", "mscoco_hallucinated_words": [["bottle", "bottle"], ["clock", "clock"], ["cup", "cup"]], "mscoco_gt_words": ["chair", "sink", "tv", "bed"], "hallucination_idxs": [35, 38, 41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.5}}, {"image_id": 567562, "caption": " In the image, there is a woman sitting at a table surrounded by three children. The table is full of food, and the woman is smiling as she eats", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "book", "broccoli", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.18181818181818182}}, {"image_id": 313928, "caption": "In the picture, there is a large outdoor area overlooking the ocean, featuring a table and chairs set up for people to enjoy their beach vacation. The table is positioned near a railing and a surfboard can be seen sitting on the ground next to the table", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["surfboard", "dining table", "chair", "bottle", "wine glass"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6}}, {"image_id": 490284, "caption": "A black dog is lying on a couch, partially covering a person seated beside it. The dog's head is near the left side of the couch, while its back end is on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 346940, "caption": "The image features a stove with a pot, skillet and an electric kettle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "knife", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "The image is a black and white photo of a street scene with people walking on the sidewalk near a gas station", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 255934, "caption": "In the image, two elephants are walking, one of which is a baby. The mother elephant is slightly larger, with a noticeable size difference", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "elephant", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 278627, "caption": "According to the image, the following descriptions are associated with the food presented in the picture:", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "potted plant", "spoon", "chair", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 400851, "caption": " The scene is an outdoor sandy beach, filled with a large group of people gathered near the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "boat", "chair", "sports ball", "umbrella", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 472610, "caption": " The image features a woman standing near a large field surrounded by cows", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 78565, "caption": "The image is an old photo of people and boats in the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": " In the scene, a boy is skateboarding down a street while riding on a bench", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["skateboard", "chair", "bottle", "person"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 289640, "caption": " In the scene, there are four people sitting at dining tables or chairs at a dining area. One person is holding a red frisbee in their hand, which they are about to throw", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "wine glass", "orange", "person", "cup", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 122602, "caption": " The image features a table with an assortment of supplies, including books, scissors, and craft paper. The table is filled with various items, such as a glue bottle and multiple paper cutouts", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["scissors", "bottle", "dining table"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 24104, "caption": "The image showcases a desk with multiple electronic devices arranged in front of a wall. On the desk, there are two computer monitors placed side by side, one of which is a 20-inch monitor and the other one is a 14-inch monitor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bed", "mouse", "keyboard", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 183709, "caption": " The image features a busy intersection with numerous people standing at various locations. Some of the people are walking around, while others appear to be waiting or hanging out", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 59710, "caption": " The image depicts a small refrigerator with a black color and two doors. One of the doors is completely open, revealing the interior of the refrigerator, while the other door is closed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": " The scene features a young boy in a baseball uniform, holding a baseball ball, dressed in green and white colors, and wearing a baseball glove", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 314729, "caption": "The image depicts a black and white baseball scene with an old baseball player holding a bat, standing in a ready-to-hit stance. The player is dressed in vintage clothing, and there is a ball on the ground, suggesting that he may be practicing for a game or an upcoming competition", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 527497, "caption": "According to the picture, there is a computer in the workplace that has a keyboard, mouse, and a TV monitor on a desk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 411564, "caption": "According to the picture, a man is sitting in a window, looking at his cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "chair", "bottle", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 320350, "caption": " According to the image, there is a group of three people standing together on snow skis in a large snow-covered field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 401857, "caption": "The image features a baseball game happening on a field. Several people are present in the scene, with some playing baseball, while others serve as the catcher and umpire", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "bench", "person", "baseball glove", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 285302, "caption": "A little boy is seated at a dining table, sitting in a chair and actively working on a craft project. The table is set with various materials like paper and scissors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "scissors", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 61959, "caption": "The image captures a city street scene, showcasing a white, double-decker bus making its way down the road. There are several cars around it, parked in various positions, such as one in front of the bus and others farther back on the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 229659, "caption": " The image depicts a laptop computer sitting on a counter in a restaurant, which is open for business. In the vicinity of the laptop, several chairs are arranged around two tables, some more closely around the counter, others scattered in the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "clock", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 473118, "caption": "The image shows a man on a skateboard riding a ramp, with a blue background. The skateboarder is in the middle of a trick, possibly doing a grind", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "In the image, a group of three people, bundled up in coats and hats, is standing in the snow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 416104, "caption": "According to the picture, there is a group of people sitting at outdoor tables while others walk by. A large number of tables with blue chairs and umbrellas are set up, providing shade for those enjoying their meals", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 511852, "caption": "In the image, there are two skiers descending a snowy hill, with the main focus being on the person on the right, skiing down the slope with skis on their backpacks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 59386, "caption": "In the image, a group of giraffes stands together in a field eating from a tree, which is located near several other trees. There are several giraffes present, with some of them closer to the tree while others are further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "According to the picture, there is a street scene with traffic lights and a few cars on the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 153692, "caption": "In the image, a man is riding a bike accompanied by his dog, while they are crossing a street. They are both wearing backpacks and appear to be on their way somewhere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "traffic light", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 265628, "caption": " The image showcases a toilet, with its bowl sitting atop a sink", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["bowl", "toilet", "person"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 499594, "caption": "In the image, a piece of meat is served on a plate along with a variety of vegetables, including broccoli", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "bottle", "knife", "broccoli", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 5934, "caption": " The image showcases a baseball glove and a baseball inside it, sitting on top of a dining table or bench", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bench", "sports ball", "baseball glove"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 47828, "caption": "The image depicts a river with a variety of blue lights, likely illuminating the bridge over the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 47916, "caption": " In the image, there are several dogs present in a grassy field, some of which are playing with a frisbee", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "car", "truck", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 255483, "caption": "This image shows a person sitting at a table with a lot of paper in front of them. They are holding a stapler or some other office object in their hand, possibly to read the documents on the table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["scissors", "dining table", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 131138, "caption": "The image shows a desk with various computer-related items, highlighting a laptop and computer monitor on top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "spoon", "mouse", "keyboard", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 258209, "caption": "According to the image, a man is sitting on a bench in front of a building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bench", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 347453, "caption": "The image captures a busy city street with multiple buses and a couple of red double-decker buses parked and driving on the street. There are several vehicles, including a truck on the left, a car in the middle, and another car on the right", "mscoco_hallucinated_words": [["truck", "truck"]], "mscoco_gt_words": ["bus", "bench", "traffic light", "car", "person"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 285820, "caption": "According to the picture, the image shows a living room with a couch, featuring a white, black, and brown interior design. There is a kitchen in the room with a table and a dining room table, and the couch is facing towards the dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bowl", "dining table", "couch", "book", "bench", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 245664, "caption": "The image features a desk with several electronic devices, including a laptop sitting on the right side, a computer monitor and keyboard placed near the laptop, and a mouse on the left side of the desk. The laptop is closed, and the computer monitor is partially visible, showing its screen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "wine glass", "book", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.625}}, {"image_id": 453731, "caption": "According to the image, there is a sleeping dog resting on a wooden floor in front of an apothecary. The dog appears to be sleeping and is surrounded by various bottles, likely containing wine", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "dog", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 524601, "caption": "A group of people is gathered in a living room playing a video game. There are four people in the scene: one standing on the left, another standing slightly behind him, one in the middle, and another standing on the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "chair", "couch", "book", "person", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 253262, "caption": "In the image, a small white propeller plane is parked on the airport tarmac, and two people are getting off of it, likely carrying their luggage with them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "airplane", "person", "truck", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 87052, "caption": "The image depicts a kitchen area, with three people standing in it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "vase", "oven", "bottle", "person", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 357578, "caption": "There is an image on a city street, featuring a fire truck driving past several cars parked next to them. The fire truck is parked on the right side of the street, with the fire engine and lights prominent on its rear side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 418692, "caption": " There is a living room in the image with a large sofa and a couple of chairs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "remote", "chair", "couch", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 259345, "caption": "According to the picture, there is a bearded man sitting on a bench, possibly outdoors, with a pink umbrella held over his head. The man is dressed in a colorful, flowing robe", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["chair", "person", "umbrella"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 119709, "caption": "According to the picture, the scene features a woman dressed in an apron, standing in front of a table covered with donuts", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 443299, "caption": "In the image, two people are sitting on a white bench next to a wall. One of them appears to be a man, wearing a jacket, while the other is a woman", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 120776, "caption": " In the image, there is a large outdoor sculpture in the shape of an 'S' that is being viewed by a group of people standing on various outdoor surfaces. The sculpture has several umbrellas positioned around it to provide shade", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 411765, "caption": " The image features a tennis court surrounded by a chain-link fence, and a man in a white and blue shirt is holding a tennis racket, preparing to hit a tennis ball. He appears to be in the middle of a tennis match", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 447991, "caption": "The image features a city street with a van parked near the curb and a woman standing on the sidewalk next to it. She appears to be looking at her phone while holding it with one hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bicycle", "handbag", "traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 276719, "caption": "A small dog is running around an intersection near two parked cars. The dog appears to be enjoying the space and its surroundings", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "truck", "chair", "handbag", "dog", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 422328, "caption": "The scene depicts a horse pulling a snow plow while traveling down a snow-covered road. There are multiple people around the horse and a snowman in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "horse", "skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 354559, "caption": "The image shows a woman dressed in a black and white stripped bustier with long hair, and she is posing with a stuffed animal. The teddy bear is quite large, covering much of her upper body", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "bear", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 438788, "caption": "The image features two pieces of cake on a dining table, with a knife cutting one of them. There is another knife located close to the knife used to cut the cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "knife", "person", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 468005, "caption": " The image features an elephant walking on a cement path near the water, with many people standing around the animal, likely enjoying the scene or waiting for a ride. The elephant is walking near the shoreline, with its massive tusks out, attracting the attention of the people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "elephant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 545594, "caption": "The image captures a group of people sitting on a bus. Several passengers can be seen, including a young girl with colorful hair in the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "orange", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 219546, "caption": "A large, elaborate dining table is filled with an array of different foods, including meats, cheese, and vegetables", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "spoon", "bottle", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 386645, "caption": "In the image, a truck has toppled over on the roof of a building, potentially causing some damage", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 155131, "caption": "In the image, a woman dressed in white is jumping high into the air, arms fully extended, as she tries to hit a ball flying above her", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "sports ball", "bench", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 188752, "caption": "According to the picture, a person has hanging a few bananas from a string above a fruit stand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 228350, "caption": " The image features a busy dining area with many people sitting around a table and a long counter. Some people are sitting near the counter while others occupy tables, where they are enjoying their meal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "chair", "tie", "wine glass", "umbrella", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 437720, "caption": "According to the picture, there is a nude woman sitting at a desk in front of a red chair and a red table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "chair", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 378831, "caption": " The image depicts a woman walking on the street, carrying two red shopping bags", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "fire hydrant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 375503, "caption": "The image captures an upstairs view of a room featuring a wooden staircase, a small clock, and a desk or table near the top of the stairs. The room is ornate with paneled walls, carpets, and a large chandelier hanging from the ceiling", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "clock", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 330369, "caption": "According to the picture, there is a large red and white boat on the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 288576, "caption": "According to the picture, a man is standing on a tree stump with a frisbee thrown near him. He is also holding a bicycle nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 32190, "caption": "According to the picture, it shows a small toy horse placed in the middle of a street in front of a parked car", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 535403, "caption": "This image displays a small bathroom with a sink and mirrors", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "clock", "bottle", "sink", "hair drier", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 449798, "caption": "The image displays a desk with multiple items placed on top of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 375769, "caption": "According to the picture, the scene features a small child wearing a helmet eating at a table in a restaurant or cafe setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bicycle", "chair", "hot dog", "umbrella", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 426172, "caption": " The image features a table display with several items in a store", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 20650, "caption": "The image features a tasty, nutritious meal with a sandwich and plenty of broccoli on the plate. The sandwich is a delicious meal in itself, but the accompanying broccoli provides a nutritious and flavorful side dish", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "sandwich", "orange", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 138078, "caption": " An outdoor baseball scene is depicted in the image, with three baseball players present in the field. Two of the players are wearing baseball gloves, and one of them is wearing red-colored clothing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 152499, "caption": "The image depicts a family swimming pool scene, with a group of people around a pool, including children, having fun in the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "dining table", "potted plant", "chair", "umbrella", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 180764, "caption": " According to the picture, a young man is eating a pink frosted donut in a kitchen setting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "microwave", "person", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 147762, "caption": " The image features a piece of food on a plate, topped with a yellow substance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "fork", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 113860, "caption": "The scene features a boat on water, moving down a river. This boat is carrying people who are riding it and enjoying their experience on the water", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460866, "caption": "The image features a large number of toothbrushes stuck in a plastic container, forming a congested mass", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "toothbrush", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 177015, "caption": "According to the picture, a man is sitting in a room, holding a cat on his lap as he uses a laptop computer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "chair", "couch", "person", "apple", "laptop", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 333998, "caption": "The image shows a well-furnished kitchen with various appliances and equipment. At the center of the room, there is a refrigerator located in front of the main refrigerator, as well as an oven situated to the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "microwave", "person", "suitcase", "refrigerator", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 47131, "caption": "The image shows a train derailed on the tracks, with several men standing on and around the car", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425447, "caption": "A white pickup truck is driving down a side street, with a sprinkler system on top of the truck spraying the back of the vehicle. A man is standing near the truck, possibly adjusting the sprinkler system or ensuring the operation is working", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295105, "caption": "The image portrays a black and white picture of a kitchen with a man standing in the middle of it. He is wearing a black shirt and appears to be enjoying a meal in the kitchen, possibly preparing or eating food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "oven", "bottle", "sink", "person", "apple", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 443259, "caption": "The image shows a very clean kitchen with two sinks and two refrigerators. The kitchen is spacious, featuring a large oven and a microwave placed on opposite ends of the room", "mscoco_hallucinated_words": [["microwave", "microwave"]], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "oven", "chair", "bottle", "sink", "orange", "refrigerator"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 537861, "caption": "There are two trains on the train tracks in the image, one of which has an odd number of cars. The trains appear to be in motion as they are moving along the railroad track", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["train", "bench", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 145020, "caption": "The image features a Disney character mascot standing in front of a large group of people at a street party. There are several people around the mascot, some closer to it and others further away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "mouse", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 249969, "caption": " The image depicts a white plate filled with assorted pieces of food, including a meat, vegetables such as broccoli and carrots, and bread. The meat appears to be sliced, while the vegetables are sliced as well", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 146504, "caption": "The image features a person's hand with a mouse placed on top of a keyboard, indicating that they are typing with the mouse. The mouse is positioned in the center of the image, while the keyboard is located to the right of the hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 40037, "caption": "The image features a grey building with a clock tower, creating an interesting scene with its unique architecture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 343218, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "car", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 301837, "caption": "It is a clean, sleek and modern kitchen featuring stainless steel appliances, a sink and an oven. The kitchen is well-lit with a skylight, making it a bright and airy space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "clock", "sink", "apple", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 309071, "caption": " The image features an elderly man wearing a button-up shirt, reaching to open the door on a parked bicycle. The bicycle is parked on the sidewalk near the curb", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "potted plant", "bicycle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 240681, "caption": "A man is standing in the middle of the street with a backpack on, leaning over to use his cellphone", "mscoco_hallucinated_words": [["cellphone", "cell phone"]], "mscoco_gt_words": ["backpack", "motorcycle", "car", "person"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 178753, "caption": "In the image, a young girl is seated in an orange chair in a room, with a cellphone to her right", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 278890, "caption": "According to the picture, a person is holding their cell phone in their hand while sitting in a crowded area, likely in a restaurant or public place", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47781, "caption": "There is a bedroom with a large red bed situated on the floor in the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "bed", "book", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 542792, "caption": "There is a very large wooden baseball bat positioned near the end of a building in a city setting. It appears to be prominently placed and stands out in the urban environment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": "The image features three people, a woman and two men, sitting at a table in a restaurant. There are pizzas placed on the table as well, which is their main meal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "chair", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 318777, "caption": " The image is a live baseball game taking place in a stadium", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 14773, "caption": " In the image, there is a plate full of hot dogs on a table, and a few more on the table's surface", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "hot dog", "bottle", "car", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 521863, "caption": "According to the picture, a person is riding a skateboard while navigating through a crowd of people. There are several other people scattered throughout the scene, with some walking in the background and others engaged in various activities", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 250540, "caption": " In the scene, there are several people riding motorcycles, with two motorcycles in the foreground and two in the background. There is a person sitting in a truck in the right side of the image", "mscoco_hallucinated_words": [["truck", "truck"]], "mscoco_gt_words": ["cell phone", "motorcycle", "handbag", "car", "person"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 211604, "caption": " In the image, a young man is lying on his back on the floor", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 298067, "caption": "This is a food-related image featuring meat and a drink. The meat, likely chicken, is pictured next to a beer or another beverage, likely an alcoholic drink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "dining table", "bowl", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 563938, "caption": "The scene depicts a man and a woman sitting on a couch together, with the man wearing sunglasses, a woman on the right and another woman on the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "couch", "bottle", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 461311, "caption": " The image depicts a large group of people gathered in a park or field on a sunny day. They are standing and walking around, spread throughout the area, and flying various kites at different heights, indicating that the park or field is a popular spot for kite flying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "kite", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 47940, "caption": " The image features a person lying on a bed, their legs resting on a book, and their feet occupying a significant portion of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "laptop", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 261318, "caption": " The image features a man sitting on a bench, holding a cell phone to his ear as he talks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "handbag", "bench", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 134768, "caption": " The image depicts a computer keyboard with a set of speakers in the background. The keyboard appears to be an electronic keyboard, with the buttons located at various positions", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["mouse", "laptop", "keyboard", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 526414, "caption": "The image shows a living room with a long table and chairs in the middle, and a black cat is sitting on top of the table", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["scissors", "bowl", "dining table", "cat", "remote", "couch", "book", "laptop", "tv", "cup"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.2}}, {"image_id": 273132, "caption": " The image depicts an older woman sitting on a park bench, with a hand touching her face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": " In the image, there is a man taking a large hot dog out of a bun while posing for the camera. The man appears to be laughing, and the hot dog is clearly visible as he is holding it up to show it to the camera", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "sandwich", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 192656, "caption": "According to the picture, it appears to be a baseball field where a man in a baseball uniform is shown standing in the grass. He is wearing a baseball glove and waving his hand, indicating he is ready to throw the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 272728, "caption": " In the image, there is a beautiful vase filled with a variety of pink, yellow, and purple flowers on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 509811, "caption": "In the image, a person is standing in front of a large number of open laptops arranged in rows of dining tables in a large lecture room, creating a scene where someone has set up a presentation and is addressing an audience of students and computers. There is a projector, placed above a chair, possibly being used during the presentation", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "book", "apple", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 412407, "caption": " The image shows a person holding a flip phone in their hand, which has an open screen displaying various lines. In the background, several other people are present, likely members of a crowd or event", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": "In the image, there is a group of people, including the woman holding the umbrella, shopping in a farmer's market area. A person can be seen wearing a handbag, while two others appear to be standing closer to the back of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "suitcase", "handbag", "umbrella", "person", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 441363, "caption": "The image captures a man in a red shirt and white shorts playing tennis on a court. He is mid-air, trying to hit the tennis ball with his tennis racket, which is also shown in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 331084, "caption": "In the image, there are four people at a dining table, where they are making pizzas. The table is filled with various ingredients and kitchen tools, including carrots, tomatoes, a knife, forks, and a bottle", "mscoco_hallucinated_words": [["fork", "fork"], ["bottle", "bottle"]], "mscoco_gt_words": ["bowl", "dining table", "spoon", "knife", "person", "pizza", "carrot"], "hallucination_idxs": [38, 42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.7142857142857143}}, {"image_id": 282553, "caption": "According to the picture, two women are walking together on a dirt path, with one of them holding a cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "cell phone", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 328818, "caption": "According to the picture, a woman in a pink shirt is bending over to tie her shoe to the bench", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["bicycle", "bench", "bottle", "person"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 3103, "caption": " The image depicts a man skateboarding down a steep ramp, possibly practicing or performing a trick. He is wearing knee pads for protection while in motion", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 188136, "caption": "The image depicts a large and open room filled with various items, including apples and an oven. A refrigerator is positioned near the center of the room, while a couple of pitchers are found on different parts of the countertop", "mscoco_hallucinated_words": [["apple", "apple"], ["oven", "oven"], ["refrigerator", "refrigerator"]], "mscoco_gt_words": ["bowl", "dining table", "sink", "orange", "person", "carrot"], "hallucination_idxs": [14, 17, 20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.75, "Recall": 0.16666666666666666}}, {"image_id": 449675, "caption": " The image shows a plate on a table, featuring a sandwich and a salad. There's a fork also on the table, close to the plate", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "bottle", "sandwich", "knife", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 191691, "caption": "According to the picture, there is a man standing in a bathroom, shaving his face", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toothbrush", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 89378, "caption": "The image depicts a man standing near a red motorcycle parked next to a brick building", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "backpack", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 99874, "caption": "In the image, a woman is seated at a table in a restaurant or dining establishment, using her cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "cat", "bottle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437895, "caption": "The image is a bedroom scene with a large bed in the center. There's a colorful comforter or blanket draped over the bed, giving it a warm and cozy appearance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 557447, "caption": " The image depicts a man in a suit wearing a yellow tie sitting at a conference table, looking down at a piece of paper in his hands. He appears to be concentrating and examining it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "tie", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 159979, "caption": " There is an interesting scene taking place on the water, with multiple people in small boats and under various umbrellas. There are four boats present, two of which have umbrellas over them, while the other two do not have such shade", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "bowl", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 357, "caption": "The image captures a professional baseball game with many players present on the field. The scene shows multiple players holding baseball bats and gloves, both in the dugout and on the field, ready to make plays or contribute to the game", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 538891, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 561967, "caption": " The image features a large train traveling along the tracks. It appears to be carrying several cars, with several of them being in a line on the train's left side, while others are scattered throughout the train's length", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "The image depicts a blue and white passenger train traveling on a railroad track. It has a long body and is in motion, moving from left to right as it passes by a train station", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 7125, "caption": " A group of people is enjoying a bike ride on a dirt path, with one man riding his bicycle in the center and others riding their bicycles to the right and left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bicycle", "bottle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 221350, "caption": "The image depicts a man holding a red and white tie, seemingly preparing to adjust or tighten it. The tie is adorned with various hearts, which can be seen as decorative embellishments", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "tie", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 280930, "caption": "The scene features a little girl, likely around four or five years old, standing in a kitchen wearing a pink shirt", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 151081, "caption": "According to the picture, a helicopter is flying over a large field with two other vehicles nearby, such as cars, trucks or construction equipment", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["airplane", "person", "truck"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 122232, "caption": " The image features a person in a yellow coat, posing on a tennis court. The person is holding a tennis racket and appears to be playing or practicing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 134223, "caption": " The image shows a plate containing a hot dog and various toppings such as ketchup and mustard. There are also French fries, with several portions placed on the plate", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "hot dog", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 198163, "caption": "In the image, a man is sitting behind a window, likely at work in a studio or a workshop. He is surrounded by countless bowls and jars, which are placed in an assortment throughout the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 3742, "caption": " The image showcases a vase containing a red rose and a bowl filled with apples placed on a window sill", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "apple", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 217593, "caption": "According to the picture, there is a little boy wearing a baseball uniform standing in a field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "chair", "handbag", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 279078, "caption": " The scene depicts a young boy standing next to a refrigerator, opening its door and pointing to the array of bottles inside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "refrigerator", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": "The image captures a moment on a tennis court where two men are playing a game of tennis. They are both holding tennis rackets, with one player holding a tennis racket in his right hand and the other player holding it in his left hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "couch", "sports ball", "person", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 477016, "caption": " The image features several people standing in a room, likely a living room. In the center of the room, a little girl is standing in front of an appliance, likely an oven or a refrigerator, with small plastic fish or aquarium inside", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["backpack", "potted plant", "oven", "sink", "handbag", "person"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 301266, "caption": " According to the picture, there is a group of people gathered in a kitchen, with several baskets and cups on the table in front of them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "spoon", "sink", "book", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 475813, "caption": "A little girl is standing in a room, possibly playing or exploring her surroundings. She is wearing pyjamas and holding a small remote control in one hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "remote", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 558784, "caption": "The image features a man standing on the side of a baseball field near a pond. The man is holding a baseball bat, and there is a baseball on the ground next to him", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["backpack", "person", "frisbee"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 308543, "caption": "The image depicts a person holding two spoons in their hand while standing in front of a sink. The person appears to be in a kitchen or bathroom setting, with the sink being close by", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "sink", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 359164, "caption": "The image shows a pair of dogs, one white and one brown, on a grassy lawn. The white dog is running in the foreground, while the brown one is standing further back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "dining table", "dog", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "This image features a large kitchen scene with various kitchen appliances. There is a large oven in the middle of the kitchen and multiple sinks and refrigerators on the left side of the kitchen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "clock", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 143479, "caption": "According to the picture, there are two men in the scene: one older gentleman in a white shirt and khaki pants, and another, closer to the right side of the image. The older gentleman is holding a tray with a group of hot dogs placed on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "hot dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 475024, "caption": " In the image, a vase with various colored flowers and leaves is prominently displayed in a room under a mirror", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 238065, "caption": "In the image, a person is on a skateboard riding on the side of a cemented block, enjoying their time and performing tricks. They appear to be practicing or honing their skills while cruising on the skateboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "According to the picture, a small bathroom has a sink and a toilet in the corner", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "sink", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 322163, "caption": "The image captures a scene in a restaurant kitchen where two men are actively preparing food together. One of the men appears to be the main cook, standing in front of the kitchen counter, and the other is situated closer to the oven area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "remote", "oven", "bottle", "person", "pizza", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 230983, "caption": "In the image, a man is shown riding a skateboard while doing a trick, as he is jumping in the air on the sidewalk. The skateboard he is riding is partially covered by a container that seems to be placed in front of it, possibly creating a dramatic scene", "mscoco_hallucinated_words": [["container", "bowl"]], "mscoco_gt_words": ["skateboard", "car", "person"], "hallucination_idxs": [37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "The image depicts a very clean and organized kitchen with a sink, stove, and oven. The sink is located in the center of the kitchen, with a black countertop surrounding it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "refrigerator", "sink", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 53431, "caption": "In a scene featuring a man sitting outdoors near a brick building, a man is using a laptop and wearing a pair of black shoes with white ties on them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "laptop", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 441840, "caption": "The image features a field with several people present", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "baseball glove", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 53465, "caption": " The image depicts a cake, or more specifically, a piece of cake that has been decorated with \u201cwelcome to punch\u201d written on it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 381031, "caption": "There are several items on a table, including a plate filled with a variety of foods, a couple of bottles, and a cup. The food on the plate includes apples, a handful of oranges, and a couple of donuts", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["dining table", "donut", "spoon", "bottle", "microwave", "apple", "cup"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.7142857142857143}}, {"image_id": 530520, "caption": "In the image, three men are sitting on the grass in front of a building, engaged in an outdoor activity", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "clock", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 539555, "caption": "According to the picture, a man in a white shirt is playing with a frisbee, attempting to throw it in the air and catch it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 279521, "caption": " In the image, there is a large silver train parked by a small train", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "train", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 560439, "caption": "The image depicts a group of people wearing snowboards engaged in an exciting winter sporting activity", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "backpack", "skis", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 248353, "caption": "The image captures a group of people standing on skis in the snow, making it a winter snow sport scene. There are four people in total, with two groups of skiers separated by a large distance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 9628, "caption": "The image captures a thrilling scene where a man is enjoying a waterskiing experience in the lake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "surfboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 330050, "caption": "According to the image, the man and woman are standing on a tennis court", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "tennis racket", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 254161, "caption": " In the image, a man is flying a kite on a brick plaza in the city, surrounded by tall buildings. There are several people standing nearby, including another man standing off to the side, as well as a few other people further back in the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "kite", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 275749, "caption": " In the image, a group of people are gathered in a room, with a man and a woman standing closely together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "mouse", "person", "laptop", "tv", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 163518, "caption": "In the image, there is a woman standing in a kitchen-like environment with a tray filled with various salads. She is wearing a black apron and blue gloves, as she appears to be prepping the food for serving", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 156696, "caption": "This is a black and white image of a train station, with two people standing on the platform. The image is slightly blurred, as if it was taken in the past", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "train", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 525202, "caption": " In the image, a pizza is placed on a counter set out on a table. The pizza has cheese on it, indicating a delicious treat for those around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "bottle", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 423984, "caption": " The image features a plate filled with a variety of food items, including carrots, broccoli, and bread", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["carrot", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 499486, "caption": " According to the picture, two cats are sleeping on a messy bed in an undisclosed location. One of the cats is on the left side of the bed, while the other is on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": " The image features a smiling man in a shirt wearing a tie while sitting in the back seat of a car", "mscoco_hallucinated_words": [["seat", "chair"]], "mscoco_gt_words": ["tie", "car", "person"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 1.0}}, {"image_id": 288729, "caption": "According to the picture, there is a small cake that has been made into a circus tent. Inside the tent, there are two dolls positioned in the middle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cake", "bear", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 177721, "caption": "According to the picture, a person in a green shirt is seen performing a skateboard trick on a railing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": " The scene features a man with a white beard wearing a hat, standing in a crowded area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "cell phone", "horse", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 252625, "caption": "The scene is set along a city street with various stores and shops visible from the road, as well as a few signs indicating the presence of parking spaces and parking restrictions. There are several people on the street, two of them on bicycles, and one person walking on the sidewalk next to the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 493610, "caption": " In the image, a blue truck is driving down a dirt road with people standing around and walking in the area. There is a large group of people, with some seated and others standing, on the back of the truck, enjoying the ride", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 302789, "caption": " The image features a small bedroom that has a single bed against one wall and a suitcase sitting on the floor next to it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bed", "bottle", "sink", "handbag", "suitcase", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 30667, "caption": "The scene features a large brown dog sitting on a boat with two people's feet visible around it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 114108, "caption": " The image displays a dining table with several people seated around it. At the center of the table, there are two pizzas, one with cheese and the other topped with vegetables", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "spoon", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 328110, "caption": " In the picture, a woman is sitting on a bench with her baby in a stroller. The baby is holding the bottle, which is likely being fed", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["handbag", "bench", "backpack", "person"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 366111, "caption": "The image features several people riding bicycles in an urban setting, creating a lively atmosphere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 532481, "caption": " The image depicts an exciting moment in the water with several people actively engaged in parasailing, kite boarding, or other water sports", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "kite", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 291634, "caption": " The scene features a sidewalk with several parked motorcycles lined up next to each other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 463678, "caption": " The image features a young man playing tennis on a court. He is in the middle of the court, wearing white and holding a tennis racket, ready to hit the tennis ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 70815, "caption": "In a black and white image, a dog is walking down a sidewalk, perhaps on a leash, on the left side of the picture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "dog", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 367872, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "sports ball", "umbrella", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 353898, "caption": " In the image, a man is sitting on a bench surrounded by a large group of pigeons", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "bench", "person", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 88269, "caption": "According to the picture, there is a bowl of soup and two grilled cheese sandwiches on a dining table. The soup is placed near the left edge of the table, while the sandwiches are situated closer to the right edge", "mscoco_hallucinated_words": [["table", "dining table"], ["table", "dining table"]], "mscoco_gt_words": ["spoon", "bowl", "sandwich"], "hallucination_idxs": [19, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 463211, "caption": "The image depicts a little girl wearing a pink backpack walking near a school bus. There are two other children in the scene, with one of them being led by the little girl", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "The image depicts a grand and elegant room with an ornate and colorful ceiling and walls, featuring a large vase of colorful flowers on the dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "vase", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 98979, "caption": "The image features a microwave sitting on a counter top next to a wine bottle. The microwave has a silver color, with the word \"Kenmore\" prominently displayed on the front", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["oven", "knife", "microwave"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 244455, "caption": " The scene features two motorcycles riding down the road, each wearing the full gear, including helmets, that typical for bikers. One of the motorcycles is more prominent, riding slightly in front of the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": "According to the picture, there is an orange pair of scissors on a table, with a pair of scissors open and a spoon sitting next to them. The spoon and scissors are positioned in the foreground of the image, creating an interesting contrast with the black fabric", "mscoco_hallucinated_words": [["spoon", "spoon"], ["spoon", "spoon"]], "mscoco_gt_words": ["scissors", "dining table", "orange"], "hallucination_idxs": [24, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 1.0}}, {"image_id": 536154, "caption": " A young boy with arms outstretched and a smile poses among many stuffed animals. The image features a blue background with a bunch of teddy bears and stuffed animals of various shapes and sizes surrounding the boy, who seems to be enjoying his time in the midst of them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cat", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 374061, "caption": " In the image, a black and white cat is sleeping on a bed and cuddling a stuffed animal, likely a teddy bear", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["teddy bear", "cat", "bed", "couch", "bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 560018, "caption": "In the image, there is a large group of people on water scooters and surfboards enjoying a day of surfing on the ocean. There are multiple surfboards visible in the scene, with people riding them and spread out over the water", "mscoco_hallucinated_words": [["scooter", "motorcycle"]], "mscoco_gt_words": ["surfboard", "kite", "person"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 353320, "caption": " In the image, there is a guitar sitting on top of a large brown electric guitar", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "bench", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 256628, "caption": "The image features a golden retriever dog sitting on a wooden deck. The dog is wearing a collar and lying down on the floor, with its tongue slightly hanging out", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": "The image depicts a large black and tan dog sitting outside, with a person in the background on the right side of the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sandwich", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 424270, "caption": "In the image, a little girl is sitting on a bed in the middle of the scene, surrounded by sheets and blankets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": "According to the picture, there is a horse walking across a parking lot, with several cars blocking its path", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 483227, "caption": "The image depicts a group of young people standing on a tennis court. There are six people in the scene, four of them holding tennis racquets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 228306, "caption": " The image features a red double-decker bus driving down a street in front of a tall building with many apartments. The bus occupies a large portion of the scene, covering most of the left side and a considerable part of the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 416384, "caption": "According to the picture, a woman in a pink bathing suit is sitting on a beach chair, looking at her cell phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "chair", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 364783, "caption": "The image shows a brightly colored bathroom with a small toilet and sink. The toilet is positioned near the center of the bathroom, and the sink is located nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "chair", "bottle", "toothbrush", "sink", "toilet", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 335041, "caption": "The image features a person, likely a woman, wearing a red jacket and black pants, skiing down a snow-covered street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 531327, "caption": "The image features a white bowl filled with a variety of colorful foods, including different types of carrots and broccoli", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["fork", "dining table", "spoon", "knife", "wine glass", "broccoli", "carrot"], "hallucination_idxs": [5], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2857142857142857}}, {"image_id": 451228, "caption": "There is a busy street scene with several buses, including a red double-decker bus, travelling in the same direction", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 256365, "caption": " The image features a plate filled with several cupcakes decorated with blue frosting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 502936, "caption": " A group of people are standing around a tennis court, and a man is playing a game of tennis on the court. He is holding a tennis racket in his hand, getting ready to hit a tennis ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451449, "caption": "In the image, a black and white dog is sleeping in a dog bed with various books on top of it. The bed is situated in the lower part of the picture, with books arranged on the left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 51054, "caption": " The scene in the image features a woman sitting in a bedroom, holding a cell phone up to her ear. The bed appears to be placed off to the right side of the room, while a pillow can be seen on the bed", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "bed", "bottle", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 1268, "caption": "In the image, a group of people is gathered near a body of water, likely a river or a canal, possibly under a bridge", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "boat", "handbag", "person", "bird"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 62692, "caption": " The image captures a woman in black and white clothing hitting a tennis ball with a racket on a tennis court. The woman appears to be in the middle of the court, swinging the racket and attempting to return the ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542771, "caption": "The image depicts a room with a chair sitting in front of a mirror and a table with chairs and vases of flowers scattered around. The chair appears to be vintage, and there are four chairs in the room, one slightly below the other chairs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant", "chair", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 575406, "caption": " | Scene | ", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "motorcycle", "potted plant", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 244834, "caption": "According to the picture, there are two people standing and walking down a rainy street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "bicycle", "clock", "umbrella", "handbag", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 151159, "caption": "The image depicts a large outdoor park, with multiple people scattered around the space. Two men can be seen skateboarding in the park, one of them on the right side, and the other on the left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 277073, "caption": "The scene features a man riding a motor scooter, and a woman is sitting behind him on the back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "motorcycle", "bicycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 377879, "caption": "In the image, two military tanks are parked on train tracks", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bed", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 436814, "caption": " The scene shows a typical office with a computer sitting at a desk along with a laptop on top", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "mouse", "laptop", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 63934, "caption": " The image shows a person on a skateboard, wearing a costume, riding in the street with various cars parked on either side of the road", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 275611, "caption": " The image showcases a delicious-looking homemade Italian cheese pizza, placed on a silver pizza pan, sitting on top of a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 516248, "caption": "In the image, there is a person sitting at a table with a computer setup", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "mouse", "keyboard", "person", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 478380, "caption": "The scene features a large herd of sheep walking along a road. A person is driving down the road in a vehicle looking out the window at the sheep", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 422326, "caption": " There is a parking lot filled with several motorcycles of different sizes and designs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 110449, "caption": "The image features three people in a room, sitting or standing around a table. Two of the people are holding cell phones, which might suggest that they are using their mobile devices", "mscoco_hallucinated_words": [["cell phone", "cell phone"]], "mscoco_gt_words": ["remote", "dining table", "person", "laptop", "tv"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 45550, "caption": "The image depicts a man posing for a photo, smiling and holding a plate containing some food, likely fried food, such as fried dough, accompanied by some pasta. There are several bottles and cups in the background, likely placed there by the restaurant's staff for patrons", "mscoco_hallucinated_words": [["bottle", "bottle"], ["cup", "cup"]], "mscoco_gt_words": ["clock", "bowl", "sandwich", "person"], "hallucination_idxs": [36, 38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.25}}, {"image_id": 444913, "caption": "In the image, a man is walking along a sidewalk with a large bush in the background", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 82709, "caption": "The image captures a dog in action, leaping up in the air while catching a pink frisbee. The dog is in the center of the scene, surrounded by numerous people seated on the grass", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "frisbee", "bottle", "dog", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 132796, "caption": "In the image, there are two people riding on the back of a large elephant", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bench", "person", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 303099, "caption": "Two cats are sitting on a toilet together in a bathroom, resting and possibly sharing the space", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "toilet", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "According to the image, there are several motorcycles parked down the street in a line. They are placed in various positions on the street, some closer to each other than others", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 205193, "caption": "According to the image, it is a kitchen scene featuring a few items in the foreground", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["oven", "microwave", "person", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 272566, "caption": "The image captures a man sitting on the ground outside, surrounded by various types of bananas arranged in different baskets", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "person", "apple", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 170099, "caption": "In the image, there is a man standing in front of a couch, wearing a blue shirt and a red tie. He is also looking down, possibly at the couch or another surface nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "orange", "couch", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 14940, "caption": "In the image, there are two stuffed animals \u2013 a cat and a dog \u2013 laying on a bed, with the cat closer to the viewer's right side and the dog on the left side", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["cat", "chair", "couch", "orange", "dog"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.4}}, {"image_id": 408449, "caption": "According to the picture, a shirtless man is skateboarding down a street next to another man, who appears to be standing near the street, observing the activity. The street is quiet with no other people or vehicles around, giving the impression that it's an unusual scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "handbag", "skateboard", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 140702, "caption": " The image showcases two elephants walking through a field, with one of them being much larger than the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 354540, "caption": "In a kitchen filled with an oven, there is a man sitting on a bench with a laptop placed on the benchtop. The man is holding a remote, likely for a presentation or video conferencing", "mscoco_hallucinated_words": [["bench", "bench"], ["remote", "remote"]], "mscoco_gt_words": ["cell phone", "oven", "chair", "person", "toaster", "laptop", "microwave"], "hallucination_idxs": [15, 29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.42857142857142855}}, {"image_id": 19763, "caption": "The image displays a close-up view of a piece of deep-dish pizza on a plate, placed on a table. The pizza appears to be partially consumed, with some slices remaining", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "chair", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 191301, "caption": "The image features a delicious-looking piece of cake or other dessert on a white platter, along with a couple of spoons placed on a table. There is also a cup and a bottle of an alcoholic beverage, likely a beer or wine, in the scene", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["dining table", "spoon", "cake", "person", "cup"], "hallucination_idxs": [34], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.8}}, {"image_id": 124236, "caption": "The image showcases a kitchen that is dimly lit by the sun. Various pots and pans are positioned on a table, giving a cluttered appearance to the scene", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 344930, "caption": "A red fire hydrant sits next to the curb on a street, surrounded by grass and shrubs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "car", "fire hydrant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 14285, "caption": " In the image, a cat is lying on a bed in a bedroom with books on a table. The cat appears to be orange, and it's occupying the majority of the scene", "mscoco_hallucinated_words": [["table", "dining table"], ["orange", "orange"]], "mscoco_gt_words": ["remote", "cat", "bed", "chair", "book", "tv"], "hallucination_idxs": [18, 25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 82488, "caption": "The image shows two beds in a room, with one bed being larger than the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "dining table", "bed", "clock", "book", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 348251, "caption": " The scene depicts a man wearing skis, skiing down a snowy hill", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 150703, "caption": "The image features a sandwich-like food item, with the toppings including various sliced vegetables, including tomatoes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["hot dog", "dining table", "sandwich", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 381615, "caption": "In a windowed room, there is a wooden chair sitting underneath a window. The chair is adorned with various plants, including several potted plants hanging from a large hanging plant holder, as well as a few others placed in other areas around the room", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "chair", "book", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 352703, "caption": "In the image, there is a woman standing at a cooking area on the sidewalk, surrounded by chairs. She appears to be cooking food in a wok, preparing a dish for an event or occasion", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["bowl", "dining table", "oven", "spoon", "bottle", "handbag", "person", "cup"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.125}}, {"image_id": 111109, "caption": "The image captures a young boy wearing shorts while sitting on a chair", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "chair", "tie", "person", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": "This scene takes place on a red street with a lot of people walking around, providing a sense of activity", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "motorcycle", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 49005, "caption": "The image captures a baseball game taking place on a field, surrounded by fans and players. A total of 14 baseball players are visible on the field, including both baseball pitchers and baseball players, such as the catcher, the batter, and several infielders", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 410114, "caption": "In the image, a large herd of horses is walking down a long, open road, along with a group of riders on their backs. The herd of horses takes up much of the road, with some scattered closer to the left side and others near the right", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["truck", "horse", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 100274, "caption": " The image depicts a train track, with multiple trains on it. The trains are traveling in various directions, with some on the left side and others on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 317254, "caption": "The image captures a man wearing a ski mask riding a motorcycle on a road in a city", "mscoco_hallucinated_words": [["ski", "skis"]], "mscoco_gt_words": ["motorcycle", "car", "person"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 425569, "caption": "The image features a large, empty kitchen with a long counter spanning most of the room. The counter is stocked with various kitchen appliances and cookware, including a mix of stainless steel pots and pans of different sizes", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 28842, "caption": " The image captures a skateboarding scene with two people skateboarding down a hill in a park", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 319607, "caption": " The image captures a busy street scene with a person riding a bicycle at the corner of a street with many cars. The road has a few traffic lights, one of which is at the intersection where the cyclist is located", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bus", "bicycle", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 210372, "caption": " The image depicts a small red kitchen with a sink and a few appliances. The kitchen features red cabinets with a few drawers, as well as some white counters and a sink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["refrigerator", "bottle", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 156915, "caption": "The image features various flowers and greens arranged in a vase on a table, creating a beautiful arrangement. The vase is filled with a large red rose and a red and white rose, along with a variety of green leaves", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "dining table", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 349642, "caption": "The image features two people sitting on a pair of adjacent benches, with a dog sitting between them. One person is closer to the left side of the image, while the other is closer to the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": "The image captures a large group of people gathered on a canal in front of numerous boats with colorful umbrellas", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["boat", "umbrella", "handbag", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 45435, "caption": " The image showcases a person's hand holding a cell phone, specifically a silver or black phone", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": " The image features a person sitting in front of a computer, working at his desk. He is surrounded by multiple keyboards, including a keyboard in front of him, another one on his right, and a third keyboard located further away from the first two", "mscoco_hallucinated_words": [["keyboard", "keyboard"], ["keyboard", "keyboard"], ["keyboard", "keyboard"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "person", "laptop", "tv", "cup"], "hallucination_idxs": [22, 26, 41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.42857142857142855}}, {"image_id": 72656, "caption": "In the picture, there are three children sitting at a small table eating together. The children are sitting on a bench located in front of the table", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["bowl", "dining table", "chair", "person", "pizza", "suitcase"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3333333333333333}}, {"image_id": 372087, "caption": " The image shows a large green and white train moving on a train track alongside the platform, where people are waiting. Some individuals are standing on the platform, near the train, while others are sitting further away from it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "suitcase", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 336209, "caption": "A young man is captured in the act of skateboarding on a ramp, enjoying a thrilling moment of skateboarding. The ramp appears to be at a skatepark or other outdoor facility", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 46031, "caption": "There is an image of a laptop computer on top of a white desk in the image. The computer appears to be turned off, with a mouse positioned near the left side of the keyboard", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "mouse", "keyboard", "laptop", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 283118, "caption": "According to the picture, the image depicts a family with a man, a woman, and a young girl sitting together at a dining table in a restaurant. They are smiling and enjoying each other's company", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "backpack", "dining table", "chair", "bottle", "handbag", "car", "person", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 429598, "caption": "The image features an old kitchen with wooden cabinets and flooring. It has a stove and oven, as well as a refrigerator and a sink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "bottle", "refrigerator", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 333365, "caption": " The scene is set in an airport with several airplanes visible. Three planes are positioned on a runway with one plane closer to the front and two planes farther away", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 424174, "caption": " The image shows a large plate filled with various kinds of apples and bananas, all placed together in the bowl", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "banana", "orange", "apple"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 3035, "caption": "The scene features a large airport runway with multiple airplanes parked at various locations", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "airplane", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 177213, "caption": "The image displays a table with a white plate on it, containing a cheese pizza placed on the left side. To the right of the pizza, there is a knife, indicating that someone might have just finished eating or preparing food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "dining table", "knife", "person", "pizza", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 438535, "caption": "The image is a black and white shot of a city street with a large clock, likely a subway station, prominently displayed in the scene. The street is narrow and busy, with many cars and people scattered in different parts of the street", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "clock", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 490711, "caption": "The image depicts a spacious and empty kitchen, featuring several white appliances and fixtures. A refrigerator is positioned towards the left side of the room, surrounded by a couple of cabinets and a sink", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sink", "banana", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 163728, "caption": "According to the image, it features a sleeping kitten lying on a dining table next to a keyboard and mouse", "mscoco_hallucinated_words": [["keyboard", "keyboard"]], "mscoco_gt_words": ["dining table", "cat", "mouse", "laptop", "cup"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 456756, "caption": " The image features two giraffes and a zebra, all together in a pen area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["zebra", "giraffe", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 281028, "caption": "The image features a train or a bus with two rows of seats going down the middle. One row is situated closer to the window, while the other row is behind it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 343937, "caption": "The scene captures a woman snowboarding down a hill in the snow", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["snowboard", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 277051, "caption": " The image depicts two birds, one smaller and the other a bit larger, sitting on a table next to some pizza slices on a plate", "mscoco_hallucinated_words": [["pizza", "pizza"]], "mscoco_gt_words": ["dining table", "chair", "bottle", "knife", "bird"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 145666, "caption": " The image showcases a pot filled with various vegetables, including broccoli, carrots, and onions. The broccoli is spread across the pot, covering a large portion of the cooking area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "broccoli", "dining table", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 304984, "caption": " The image displays a delicious meal consisting of a sandwich and a side dish on a plate. The sandwich appears to be a French toast sandwich, with a piece of cake on the side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "cake", "sandwich", "wine glass", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 122467, "caption": "A person is shown holding a video game remote controller, likely for the Nintendo Wii, in their left hand. The remote controller is positioned in a way that highlights their injured hand", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "remote", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 518287, "caption": "The image features a toothbrush with a smile in the middle. It's likely the brush has a unique design or is a custom piece", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "toothbrush", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 145448, "caption": "According to the picture, there is a cat sitting on top of a flat sheet that is covering a car seat", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "dining table", "cat", "chair", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 352900, "caption": " |  The image features a plate of pasta on a table with several pieces of broccoli distributed throughout", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["fork", "bowl", "broccoli", "knife"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 153607, "caption": "According to the picture, there is a collection of three vases filled with water, each featuring a flower in a slightly different arrangement. The flowers appear to be orange, with one flower being placed in the middle, another on the left, and a third on the right side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "bowl", "dining table", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 157581, "caption": " The image shows a dining table with a variety of wine bottles lined up on top of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "bottle", "wine glass", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 227438, "caption": "According to the picture, a spacious bedroom is shown with a large bed sitting in the middle of the room. There is a nightstand on the right side of the bed, and a television sitting on the wall to the left of the bed", "mscoco_hallucinated_words": [["television", "tv"]], "mscoco_gt_words": ["chair", "couch", "clock", "bed"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.25}}, {"image_id": 116037, "caption": "This image showcases a baseball game in progress, with a batter standing in front of home plate ready to swing at a ball coming towards them. The batter is holding a baseball bat, while a catcher and an umpire are nearby, anticipating the swing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 202658, "caption": "The image features a white toilet sitting on the ground outside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bowl", "toilet"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 18150, "caption": " The image shows a man and a young child sitting on a couch, playing together. The man appears to be eating a slice of pizza, with a child next to him eating a similar pizza", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "couch", "bottle", "person", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 418711, "caption": "The image features a man on a bike with a large amount of bananas tied to it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "bicycle", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 92107, "caption": "The image features a green bowl filled with food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bowl", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 491000, "caption": "According to the picture, there is a group of people walking down a narrow city street. They are located near a building in the middle of the scene, and several other people are standing and talking", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "handbag", "car", "person", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 401163, "caption": "A man sits on a park bench surrounded by trees while a woman and another man stand in the park. The park bench is positioned in the center of the scene, with the woman on the right and the other man on the left", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 39663, "caption": "The image shows a variety of items arranged on the floor. The most prominent among these items is a backpack, which takes up the largest part of the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "scissors", "backpack", "book", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 268293, "caption": "The image features a man, who is wearing a gray shirt, playing tennis and holding a tennis racket. He appears to be in the middle of a match, ready to return the ball with his racket", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "The image depicts a small, clean kitchen with white cabinets and light wooden flooring. The kitchen has a combination oven/microwave (oven) located near the right side of the room and a sink located at the center, by the refrigerator", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["vase", "oven", "spoon", "bottle", "clock", "sink", "apple"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.2857142857142857}}, {"image_id": 358086, "caption": "According to the picture, a group of people, consisting of men and women, are engaged in various actions on a grass field", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "chair", "bottle", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 89541, "caption": "In the picture, there is a tray filled with a variety of food items, primarily consisting of fruits. Among the fruits, there are several strawberries and blueberries, as well as other toppings and pastries", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "cake", "bowl", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 239445, "caption": " The image shows a man standing in an open area outdoors, possibly at a park or a garden. He is holding two white frisbees, one in each hand, as he smiles while the frisbees are upside down", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "According to the picture, a kangaroo is standing in a field with a colorful kite on top of it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "kite", "dog", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 487990, "caption": "A person is standing over a large table filled with various different foods", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fork", "bowl", "dining table", "donut", "spoon", "bottle", "cake", "knife", "person", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 138834, "caption": "According to the picture, there is a man in the snow wearing a black jacket, carrying his skis, and walking with them in tow. The snow is quite heavy, making it a bit challenging for the person to carry his equipment on his back", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skis", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 492057, "caption": "In a bathroom, a man is standing in front of a mirror while taking a selfie with a cell phone. There are a few people visible in the background, some closer and others more in the distance", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388215, "caption": "The image captures a tennis court with a person in the center of the court, preparing to hit a tennis ball", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tennis racket", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 111409, "caption": "The image features a man riding a motorcycle down a street, likely on a city block", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451391, "caption": "This image displays a beautiful bouquet of greens on a table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["broccoli", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 92462, "caption": "The image depicts a street scene with several cows walking down the road, likely as part of a herding process", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "car", "person", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 397268, "caption": "The image shows a small bike store inside a building with various bicycles on display in the window, including a few behind chairs outside", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "chair", "bench", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 127659, "caption": " The image shows a long train traveling along a train track, with people standing by the platform as they wait for the train to come to a stop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "bench", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 251857, "caption": "The image features two men riding skateboards in a city park, with one person performing tricks on his skateboard and the other person watching. They are positioned in different parts of the park, with one person closer to the right side of the image and the other closer to the left side", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["skateboard", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 243212, "caption": "According to the picture, a young child is standing in a park with a blue frisbee in their hand. There are several vehicles parked nearby, including cars, one of which is closer to the child", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "car", "truck", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 444304, "caption": "The image depicts a young man kneeling on the floor while holding a remote control. In front of him, there is a television set and multiple game controllers", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "remote", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 305000, "caption": "According to the picture, there are various vegetables and fruits displayed at a woman's stand in a marketplace", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "apple", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "The image features two men sitting at a table, possibly in a dining or banquet setting, enjoying a meal or event. Both men are dressed in tuxedos, and one is wearing a bow tie", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tie", "bottle", "wine glass", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 154846, "caption": "The image features a large pepperoni pizza with mushrooms on it, placed on a table. There are several people in the scene, some of whom are dining or chatting, while others are simply enjoying the food", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["pizza", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 567254, "caption": "A small child is the main subject in the image, standing in front of a TV", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "tv", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 79261, "caption": "There is a man in a swimming pool in the middle of a street filled with water, cleaning and paddling the pool with a broom. The street is filled with people from all different places, sitting and standing around the area", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "backpack", "clock", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301402, "caption": "The image captures a man sitting at a dining room table, using his laptop. He is wearing a hat and a black jacket, and has his hands on the table, likely working on his laptop", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "potted plant", "chair", "bottle", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 415828, "caption": " The image features a group of people walking down a long sidewalk alongside some tall buildings in an urban setting. A man with an umbrella is in the center of the group, standing underneath it for shade", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "stop sign", "umbrella", "handbag", "traffic light", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 543231, "caption": " In the image, a woman is playing Wii with her friend", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["remote", "bowl", "bed", "book", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 495357, "caption": "The scene is an outdoor street event where a little boy is sitting on the back of a motorcycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["handbag", "motorcycle", "dog", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 523175, "caption": "According to the picture, a bowl filled with soup is present on a table. The soup is topped with several pieces of carrots, as well as some green beans and a spoon", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bowl", "carrot", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 184945, "caption": "The image depicts a parking lot or garage area with several motorcycles parked on the sidewalk", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "motorcycle", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 49942, "caption": " The image features a young man holding an umbrella over his head. He is staring up and slightly to the right, with an expression that suggests a slight confusion", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tie", "person", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 223019, "caption": "There is a blue train parked at a train station in the image", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "train", "handbag", "car", "person", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 42889, "caption": "The image displays a teddy bear sitting next to a laptop on a table", "mscoco_hallucinated_words": [["laptop", "laptop"], ["table", "dining table"]], "mscoco_gt_words": ["teddy bear", "bear", "keyboard"], "hallucination_idxs": [10, 13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 22112, "caption": "The image features a shelf or table filled with various objects, including a pair of vases, one filled with flowers and the other with greenery, as well as some other plants and sculptures.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "potted plant", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 247587, "caption": " The image features a man standing on a white surfboard at a beach location. He is likely enjoying the waves and the warm sandy environment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["surfboard", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": "In the image, a large city bus is parked on the street with its bicycle rack and the back of the bus towards the viewer. There are several bicycles parked next to the bus on the street, and a person appears to be taking the time to observe them", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "car", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 545056, "caption": " This image depicts a large field with many cows grazing on it. The cows are spread out across the grassy landscape, enjoying the pasture", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sheep", "dog", "car", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 401411, "caption": " The image features a man standing in the middle of a kitchen, likely at a restaurant or other food-related setting. There are several people in the scene, some of them further away from the man in the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "oven", "book", "person", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 2867, "caption": " The scene is set amid snowy ski slopes, with several people skiing together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "skis", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 246963, "caption": " The scene features a group of motorcycle riders driving down the road together, with several of them positioned at the back of the pack", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["stop sign", "motorcycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498225, "caption": " The scene features a group of people standing outside a bakery or cake shop, most likely in a bustling city or town. There are four distinct people in the image, two of them are women and the others are men", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "donut", "cake", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124601, "caption": " There is a small kitchen with two ovens in it, placed one above the other. One of the ovens is located at the top of the image, while the other is below", "mscoco_hallucinated_words": [["oven", "oven"], ["oven", "oven"]], "mscoco_gt_words": ["dining table", "bottle", "keyboard", "sink", "wine glass", "microwave", "laptop", "cup"], "hallucination_idxs": [7, 20], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 581749, "caption": " The image features a variety of fruits and vegetables placed on a table, including oranges and broccoli", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["orange", "broccoli", "dining table"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 227960, "caption": "The image features a white square dish filled with food on a dining table. The food appears to consist of a mix of cooked broccoli and carrots", "mscoco_hallucinated_words": [["table", "dining table"], ["broccoli", "broccoli"]], "mscoco_gt_words": ["bowl", "spoon", "wine glass", "carrot", "cup"], "hallucination_idxs": [13, 25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.2}}, {"image_id": 286503, "caption": "The image features an elephant standing outdoors near a fence, likely in a zoo or park. The elephant is occupying the center of the scene, with a person standing nearby, likely observing the animal or taking part in some activity involving it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "person", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 315740, "caption": "The image features a large and clean kitchen with hardwood flooring, metal appliances, and modern touches. A sink is located near the center, surrounded by a variety of cabinets and drawers for storage", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "potted plant", "oven", "chair", "couch", "sink", "tv", "microwave"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 142108, "caption": "The image depicts a group of women and young girls sitting and working around a dining table", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["banana", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 542933, "caption": "", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["baseball bat", "chair", "sports ball", "bench", "person", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 475043, "caption": "In the image, there is a group of five people gathered around a couch in a living room. Four of them are sitting on the couch while one person is standing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "spoon", "couch", "bottle", "person", "laptop"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 456784, "caption": "The image depicts a person holding a knife and cutting a cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "knife", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 33753, "caption": "The image features a wooden park bench sitting outside, and a remote control is placed on top of the bench", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "bench", "remote", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 448694, "caption": " In the image, two young men are playing a game of frisbee as they battle it out in a field with their friends watching and cheering them on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["chair", "person", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": " The image displays a delicious bowl of Chinese noodles with vegetables and meat. The bowl is filled with the noodles and vegetables, including broccoli and carrots, along with a fork and a spoon for serving and eating the dish", "mscoco_hallucinated_words": [["spoon", "spoon"]], "mscoco_gt_words": ["fork", "bowl", "dining table", "broccoli", "carrot"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.8}}, {"image_id": 503210, "caption": "The image is of a living room filled with a couch, a TV, and a table. The couch is positioned against the far wall and extends across a large portion of the room, while the TV is placed near the center of the space", "mscoco_hallucinated_words": [["tv", "tv"], ["table", "dining table"], ["tv", "tv"]], "mscoco_gt_words": ["vase", "potted plant", "chair", "couch", "clock", "book", "orange"], "hallucination_idxs": [13, 17, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6, "Recall": 0.14285714285714285}}, {"image_id": 142257, "caption": " The image shows a busy city street, with a red car traveling down the road. Several traffic lights are visible, positioned above the street at various points, controlling the flow of traffic", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "car", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}], "overall_metrics": {"CHAIRs": 0.12525252525252525, "CHAIRi": 0.06157270029673591, "Recall": 0.41950321987120515, "num_hallucinated_caps": 62.0, "num_caps": 495.0, "hallucinated_word_count": 83.0, "coco_word_count": 1348.0, "length_response": 30.272727272727273, "hallucinated_caps_ls": [144305, 493862, 401027, 343534, 209347, 12375, 2154, 104326, 233888, 183766, 169169, 344942, 185327, 401010, 313928, 388237, 122602, 265628, 5934, 347453, 259345, 443259, 537861, 240681, 178753, 250540, 526414, 331084, 328818, 188136, 151081, 477016, 558784, 230983, 381031, 118124, 328110, 88269, 98979, 379443, 560018, 531327, 110449, 45550, 14940, 354540, 191301, 14285, 352703, 317254, 35827, 72656, 163728, 277051, 352900, 227438, 474499, 42889, 124601, 227960, 99053, 503210]}}}