{"overall_metrics": {"CHAIRs": 0.27, "CHAIRi": 0.10577971646673937, "Recall": 0.4733485193621868, "num_hallucinated_caps": 135.0, "num_caps": 500.0, "hallucinated_word_count": 194.0, "coco_word_count": 1834.0, "length_response": 41.106, "hallucinated_caps_ls": [144305, 308003, 95908, 324008, 501311, 39053, 253630, 161227, 195645, 32625, 343534, 254368, 233888, 213905, 409346, 344942, 275929, 300124, 12669, 133146, 498747, 185327, 454161, 129707, 368367, 201555, 489909, 405183, 333712, 148977, 183571, 325836, 467887, 557998, 401010, 313928, 122602, 24104, 279407, 527497, 229659, 265628, 499594, 258209, 245664, 453731, 418692, 259345, 443299, 545594, 219546, 535403, 375769, 426172, 138078, 152499, 180764, 537861, 146504, 301837, 240681, 14773, 563938, 134768, 526414, 192656, 412407, 191691, 159979, 357, 134223, 198163, 217593, 475813, 53431, 441840, 381031, 9628, 330050, 254161, 423984, 118124, 288729, 252625, 302789, 30667, 353898, 88269, 536154, 560018, 353320, 416384, 531327, 1268, 436814, 63934, 45550, 303099, 205193, 272566, 14940, 191301, 124236, 14285, 82488, 150703, 49005, 410114, 210372, 429598, 490711, 145666, 227438, 18150, 474499, 89541, 487990, 127659, 444304, 543231, 495357, 523175, 184945, 223019, 42889, 401411, 2867, 246963, 124601, 581749, 286503, 142108, 475043, 456784, 99053]}, "results": {"sentences": [{"image_id": 144305, "caption": "A laptop computer is sitting on a desk, with a keyboard and mouse nearby. There is also a headset and a computer monitor on the desk. The laptop is connected to a network cable, and there is a computer mouse connected to the laptop.", "mscoco_hallucinated_words": [["mouse", "mouse"], ["monitor", "tv"], ["mouse", "mouse"]], "mscoco_gt_words": ["laptop", "keyboard", "dining table"], "hallucination_idxs": [13, 24, 43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2727272727272727, "Recall": 1.0}}, {"image_id": 164091, "caption": "A doll and a stuffed animal are sitting in a crib, surrounded by a bed and a stuffed animal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "teddy bear", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 308003, "caption": "A wooden bench is situated in a grassy area, with a tree nearby. The bench is covered in green paint, and it appears to be weathered. The tree provides shade, and the bench offers a comfortable spot for people to rest or sit and enjoy the natural surroundings.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "bench", "chair"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 54870, "caption": "A delicious meal is being served on a white plate, consisting of a chicken sandwich, lettuce, tomato, and a side of fries. The chicken sandwich is topped with cheese, and the lettuce and tomato are fresh and crisp. The meal is accompanied", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["knife", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 95908, "caption": "A white coffee mug sits on a wooden table, next to a computer mouse and a keyboard. The computer mouse is connected to a computer, and the keyboard is connected to the computer as well. The image shows a person using the computer and the mouse to navigate through a website or perform other tasks on the computer", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["laptop", "dining table", "keyboard", "mouse", "cup"], "hallucination_idxs": [43], "metrics": {"CHAIRs": 1, "CHAIRi": 0.07692307692307693, "Recall": 0.8}}, {"image_id": 329614, "caption": "A city street with a bus and cars is shown in the image. The bus is parked on the side of the road, and there are cars driving by. The scene is set in a city with a church and a building in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 324008, "caption": "A tray of food, including a sandwich, a banana, and a bowl of yogurt, is spread out on a table in an airplane.", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["bowl", "bowl"]], "mscoco_gt_words": ["person", "dining table", "banana", "orange", "airplane", "train", "cup"], "hallucination_idxs": [7, 14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.42857142857142855}}, {"image_id": 52700, "caption": "A group of people are gathered around a table filled with various desserts, including cakes, cupcakes, and cookies. They are enjoying the desserts and socializing with each other.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "spoon", "cake", "handbag", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 501311, "caption": "A baseball player is pitching a ball on a green field, surrounded by a crowd of people watching the game. The player is wearing a baseball uniform and holding a baseball bat, ready to hit the ball. The image captures the excitement and energy of the game, as the crowd cheers and the player prepar", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 247179, "caption": "A group of people dressed in traditional attire, including a man in a turban, are walking down a street in a city, accompanied by elephants decorated with lights. The scene is likely from a cultural event or festival, where the elephants are being paraded as part of the celebration.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "clock", "person", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 577912, "caption": "A luxurious bathroom with a large bathtub, a sink, and a toilet is featured in the image. The bathroom has a white and beige color scheme, with a wooden floor and a window providing natural light. The bathroom is well-equipped with modern fixtures and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["toilet", "sink", "bottle", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 196341, "caption": "A group of people is walking through a large clock tower, admiring the intricate design and architecture of the structure. The clock tower is located in a city, and it appears to be a popular tourist attraction. The people are standing in front of the clock, looking at the time and taking in the unique", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 234433, "caption": "A bicycle sign is posted on a pole next to a staircase, indicating that riders should ride their bikes on the left side of the stairs.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 455610, "caption": "A group of people are gathered around a red and green motorcycle, admiring its unique design and colorful paint job. The motorcycle is parked on the street, and there are people standing around it, taking pictures or simply enjoying the sight. The image captures the excitement and interest that the motorcycle", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "traffic light", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 39053, "caption": "A table is filled with various dishes, including a bowl of eggs, a plate of pancakes, and a bowl of yogurt. There are also several utensils, such as a spoon and a fork, on the table. The image shows a breakfast spread, with the food items", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["apple", "dining table", "spoon", "bowl", "cake", "cell phone", "cup"], "hallucination_idxs": [37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.5714285714285714}}, {"image_id": 493862, "caption": "A young man is standing in a grassy field, holding a tennis racket and looking up at the sky.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 269873, "caption": "A group of people is walking down a city street, passing by a streetcar. The streetcar is parked at a stop, and the people are walking in both directions. The scene is busy and lively, with people of different ages and genders walking together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 524656, "caption": "A kitchen with a stainless steel sink, a stove, and a refrigerator is filled with various kitchen utensils and appliances. The sink is clean and organized, while the stove and refrigerator are both in use. There are also several pots and pans on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "bottle", "wine glass", "oven", "bowl", "knife", "refrigerator", "microwave", "toaster", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2727272727272727}}, {"image_id": 369547, "caption": "A black and white dog is sitting on a beach, surrounded by sand and rocks.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "cat", "dog"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 181446, "caption": "A man is standing in front of a refrigerator, holding a bottle of ketchup and looking at the contents of the fridge.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "bowl", "refrigerator", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 128119, "caption": "A city bus is parked on a street, with a bike rack on the front. The bus is empty, and there are two bicycles attached to the rack. The scene is set in a busy urban environment, with a tall building visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "cell phone", "handbag", "bus", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 401027, "caption": "A sandwich with lettuce, tomato, and cheese sits on a white plate, surrounded by a black cup and a candle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "sandwich", "fork", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 253630, "caption": "A large, dark brown wooden dining table is placed in the middle of a room, surrounded by a rug and a couch. The room has a TV and a chair, creating a comfortable and inviting atmosphere for socializing and enjoying meals.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["dining table", "tv", "chair", "potted plant"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 326021, "caption": "A woman is sitting at a table with a teddy bear and a sign that reads \"Badger Day - Are You Ready to See the Results?\" The woman is holding a red tablecloth, and the teddy bear is placed on top of the table. The sign suggests that the event is related to eye", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "teddy bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 317320, "caption": "A man rides a bicycle on a busy street, passing by a yellow line on the pavement.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 507171, "caption": "A man is surfing on a wave in the ocean, riding a surfboard. He is wearing a wetsuit and a helmet, which suggests that he is an experienced surfer. The image captures the moment when he is in the air, performing a trick or stunt, as", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cat", "surfboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 161227, "caption": "A black leather couch is sitting in front of a TV, with a remote control and a laptop on the coffee table. The couch is empty, and there is a TV remote on the table.", "mscoco_hallucinated_words": [["tv", "tv"], ["table", "dining table"], ["tv", "tv"], ["table", "dining table"]], "mscoco_gt_words": ["laptop", "chair", "couch", "cell phone", "keyboard", "remote"], "hallucination_idxs": [10, 22, 33, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4444444444444444, "Recall": 0.5}}, {"image_id": 25812, "caption": "A man is skiing down a snowy slope, enjoying the winter sports experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 267537, "caption": "A group of women, dressed in formal attire, are sitting on bleachers at a stadium, enjoying a sporting event.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tie", "umbrella", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 195645, "caption": "A group of people, including a man and a woman, are gathered around a table in a park, enjoying a meal together. They are sitting on benches and chairs, and there are wine glasses on the table. The scene is described as a \"family gathering\" and the people are sm", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "bench", "handbag"], "hallucination_idxs": [32], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.6666666666666666}}, {"image_id": 155671, "caption": "A busy street scene with a red light at an intersection, cars parked along the side of the road, and a pedestrian walking down the sidewalk.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 412894, "caption": "A busy street scene in London features a group of people walking down the sidewalk, with a red double-decker bus passing by. The image captures the vibrant atmosphere of the city, showcasing the city's iconic landmarks, such as the London Underground sign, and the presence", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["traffic light", "handbag", "person", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 32625, "caption": "A man is sitting at a table with a cup of coffee and a bowl of soup in front of him. There is also a glass of water on the table.", "mscoco_hallucinated_words": [["man", "person"]], "mscoco_gt_words": ["dining table", "bowl", "book", "fork", "cup"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6}}, {"image_id": 18688, "caption": "A baseball player is standing on the field, ready to pitch the ball to a batter. The batter is waiting at the plate, ready to hit the ball. The scene is set in a baseball stadium, with a crowd of people watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 343534, "caption": "A young girl is sitting on a chair next to a stuffed animal, holding a teddy bear. She is wearing a pink sweater and black boots, and her hair is styled in a bun. The scene is set in a room with a couch and a table, creating a co", "mscoco_hallucinated_words": [["girl", "person"], ["couch", "couch"], ["table", "dining table"]], "mscoco_gt_words": ["potted plant", "chair", "dog", "teddy bear", "book"], "hallucination_idxs": [2, 47, 50], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6, "Recall": 0.4}}, {"image_id": 370657, "caption": "A group of people, including a man, a woman, and a child, are riding motorcycles on a street in a small town. They are all wearing helmets and are surrounded by various baskets and bags, indicating that they are traveling with their belongings. The scene shows", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 481596, "caption": "A man is sitting in the stands at a baseball game, eating a hot dog while watching the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 460347, "caption": "A city street with a bus and multiple cars is shown in the image. The bus is parked on the side of the road, while cars are driving down the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 398753, "caption": "A baseball game is taking place on a field, with a large crowd of people watching from the stands. The players are wearing baseball uniforms and are engaged in the game, with one player swinging a bat and another player catching a ball. The image captures the excitement and energy of the game, show", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 67833, "caption": "A group of friends are enjoying a meal together at a restaurant, with a large pizza on the table. They are sharing a variety of food items, including bread, cheese, and vegetables, and are using utensils to eat their meal. The atmosphere is casual and relaxed,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "bowl", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 272880, "caption": "A woman is holding a pizza slice and a pizza box, with a sign that reads \"Mystic Pizza\" on the box. She is eating the pizza and enjoying her meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 254368, "caption": "A man is sitting on a bed, eating a sandwich while wearing a white bathrobe.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["person", "pizza", "bed"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 193108, "caption": "A young baseball player is practicing his swing in a baseball field, with two other players nearby. The player is wearing a black and yellow jersey, and he is standing in front of a fence, ready to hit the ball. The image captures the moment of focus and determination as the player", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 459141, "caption": "A woman rides a bicycle with a large basket on the front, carrying a bag of groceries.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "person", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 231534, "caption": "A man is standing next to a large airplane, which is parked on the tarmac. The airplane has a number of suitcases and luggage on it, indicating that it is about to take off. The man is looking at the airplane, possibly waiting for his flight or checking the lug", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "truck", "airplane", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 227031, "caption": "A man and woman are standing at a table, holding a cake. They are likely celebrating a special occasion, such as a wedding or anniversary, and are about to cut the cake together. The man is holding a knife, and the woman is holding a cake server. The cake", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "potted plant", "cake", "knife", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 209347, "caption": "A woman is sitting on a subway train, using her phone while waiting for the train to move. She is wearing a black jacket and has a red scarf around her neck. The train is in motion, and she is holding her phone in her hand, possibly checking her social media or browsing the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "tie", "handbag", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 523292, "caption": "A cat is sitting on a laptop, looking at the screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "tv", "chair", "cat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 12375, "caption": "A white plate is filled with a variety of food items, including a pork chop, potatoes, and carrots. The dish is served on a table, and it appears to be a well-balanced meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "carrot", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 13550, "caption": "A young woman is sitting on a rock, holding an elephant's trunk, and smiling at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 146837, "caption": "A young man is skateboarding down a sidewalk, performing a trick by jumping over a curb. The image captures the moment of his jump, showcasing his skill and agility on the skateboard.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "person", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 67042, "caption": "A man is standing in a long, narrow corridor, looking at his phone. He is dressed in a suit and tie, and appears to be waiting or checking his phone while walking down the hallway.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 209925, "caption": "A baseball player is pitching a ball on a field, with a catcher standing behind him. The player is wearing a baseball uniform and a baseball cap, while the catcher is wearing a catcher's mask and glove. The image captures the moment of the pitch, with the ball flying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 2154, "caption": "A man is sitting on a bench next to a trash can, surrounded by a pile of trash and a shopping cart.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "bench", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 274931, "caption": "A black and white image of a city street shows a row of old cars parked along the sidewalk, with a streetlight in the background. The cars are parked in a row, creating a sense of nostalgia and old-fashioned charm.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 104326, "caption": "A spacious and well-lit kitchen with a dining table and chairs is the main focus of the image. The kitchen features a wooden floor and a large wooden table with chairs, creating a cozy and inviting atmosphere. The room is also filled with natural light, which enhances the overall amb", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "dining table", "oven", "potted plant", "chair", "knife", "microwave", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 233888, "caption": "A young boy is playing baseball in front of a television, using a baseball bat to hit a ball on the screen. The television is displaying a baseball game, with a player in the middle of a pitch. The boy is wearing a baseball uniform and a helmet, and he is standing in front of the TV", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "tv", "potted plant", "baseball bat", "baseball glove"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.6}}, {"image_id": 213905, "caption": "Two women tennis players are standing on a tennis court, one holding a tennis racket and the other holding a tennis ball. They are likely in the middle of a match, as they are wearing tennis attire and are standing near a tennis net.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "tennis racket", "chair", "backpack"], "hallucination_idxs": [22], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 277479, "caption": "A young girl is standing in front of a refrigerator, reaching for a jar of pickles. She is wearing a yellow shirt and has a bottle of ketchup in her hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 300784, "caption": "A group of children are sitting on a bench, holding a large wooden sword and a shield. They are dressed in medieval-style clothing and appear to be engaged in a playful activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "dog", "bench", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 183766, "caption": "A delicious fruit tart is displayed on a white tablecloth, surrounded by three elegant dessert forks. The tart is topped with fresh berries and a sprinkle of gold leaf, making it a visually appealing and tasty treat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "cake", "knife", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 169169, "caption": "A group of people are walking down a city street, passing by a large green and white sign that reads \"Spring in the City.\" The sign is placed on a pole, and it is surrounded by a few trees and a parked car. The scene suggests a lively and vibrant atmosphere in the city,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "potted plant", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 409346, "caption": "A group of women are gathered around a table, enjoying a meal together. One woman is holding a plate of food, while another woman is holding a fork and a knife. They are likely sharing a dessert or a buffet-style meal, as there are multiple dishes on the table.", "mscoco_hallucinated_words": [["fork", "fork"], ["knife", "knife"]], "mscoco_gt_words": ["spoon", "dining table", "person", "bowl", "cake"], "hallucination_idxs": [30, 33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.4}}, {"image_id": 522262, "caption": "A row of bicycles is parked on a sidewalk, with a building in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 79014, "caption": "A man is holding a yellow ball in his hand, and he is standing in front of a fence.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 344942, "caption": "A small wooden toy, possibly a wooden man, is sitting on a computer monitor, looking at the screen.", "mscoco_hallucinated_words": [["man", "person"]], "mscoco_gt_words": ["laptop", "tv", "clock"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 275929, "caption": "A pair of white toilets sits on the stairs, with one toilet on the bottom step and the other on the top step. The toilets are surrounded by a wooden railing, and there is a small wooden bench nearby. The image captures a scene of two toilets", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["bowl", "toilet", "sink"], "hallucination_idxs": [40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3333333333333333}}, {"image_id": 465601, "caption": "A group of people, including an elderly man and a woman, are walking down a cobblestone street in a small town. They are holding umbrellas to protect themselves from the rain, which is falling around them. The scene is reminiscent of a quaint, charming town,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "umbrella", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 300124, "caption": "A small, old couch is sitting on the sidewalk in front of a house, with a microwave oven on top of it.", "mscoco_hallucinated_words": [["oven", "oven"]], "mscoco_gt_words": ["dining table", "microwave", "couch", "chair"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 46919, "caption": "A man is walking down a snowy mountain slope, wearing a red jacket and carrying a backpack. He is using snowshoes to traverse the snowy terrain, which is covered in trees and snow. The man is walking uphill, possibly on a hiking trail, and appears to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 434022, "caption": "A white train engine is pulling a long line of black coal cars down a railroad track, with smoke billowing from its exhaust.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 490491, "caption": "A street sign is mounted on a brick wall, with a tree growing out of the wall. The tree is surrounded by a fence, and there is a street sign on the fence. The image captures the unique and quirky nature of the urban landscape, where a tree has grown through a brick wall", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "stop sign"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 175878, "caption": "A group of friends are gathered outside, enjoying each other's company while using their smartphones. They are standing in front of a window, possibly in a living room or a balcony, and appear to be engaged in a conversation or sharing content on their devices. The scene captures the modern-", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 12669, "caption": "A group of people, including a woman, are gathered around a table in a gallery, enjoying a wine tasting. They are standing and talking while holding wine glasses, and the woman is holding a wine bottle. The scene suggests a social and enjoyable atmosphere, where people can come together to appreciate", "mscoco_hallucinated_words": [["table", "dining table"], ["bottle", "bottle"]], "mscoco_gt_words": ["person", "vase", "wine glass", "handbag"], "hallucination_idxs": [13, 40], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.5}}, {"image_id": 192496, "caption": "A train is parked on a railroad track, with a passenger car and a locomotive engine visible. The train is painted in a blue and white color scheme, and it appears to be in a station or on a platform.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 133146, "caption": "A spacious living room with a brown leather couch, a brown armchair, and a brown recliner is filled with various decorative items, such as a vase, a lamp, and a book. The room also features a fireplace, a coffee table, and a large window.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["tv", "chair", "couch", "book", "vase"], "hallucination_idxs": [46], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6}}, {"image_id": 53744, "caption": "A close-up image of a plate with a sandwich, tomato, and lettuce on it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 375902, "caption": "A young woman is skiing down a snowy slope, wearing a blue and white outfit and carrying a pair of skis. She is participating in a ski race, and there are flags and a finish line visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 498747, "caption": "A group of friends are gathered around a man who is holding a cell phone, possibly taking a selfie or making a call. They are all smiling and enjoying each other's company. The scene is set in a living room, with a table and chairs present. The man is wearing a swe", "mscoco_hallucinated_words": [["table", "dining table"], ["chair", "chair"]], "mscoco_gt_words": ["bird", "cell phone", "bottle", "person"], "hallucination_idxs": [47, 49], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 52435, "caption": "A group of people are enjoying a day at the beach, with some people swimming in the ocean and others sunbathing on the sand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "umbrella", "surfboard", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301977, "caption": "A cow stands in front of a store filled with various drinks and snacks, looking at the shelves.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "cow", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 261097, "caption": "A young man wearing a tennis outfit and holding a tennis racket walks across a blue tennis court, looking at the audience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tennis racket", "bench", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 227204, "caption": "A group of three women, including an elderly woman, are sitting at a dining table, enjoying a meal together. They are eating a variety of foods, including fruits, bread, and a bowl of soup. The elderly woman is holding a cup of coffee, and the other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "spoon", "bowl", "cell phone", "banana", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4444444444444444}}, {"image_id": 353981, "caption": "A vintage airplane is parked on a runway, with a man standing next to it. The airplane has a large wing and is surrounded by a trailer. The man is likely a mechanic or an airport employee, and he is inspecting the aircraft. The image captures a moment", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "airplane", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 185327, "caption": "A group of elephants is walking down a street in a city, with a car passing by. The elephants are likely part of a circus or a traveling show, and they are being led by a man on a bicycle. The scene is quite unusual and interesting, as it combines", "mscoco_hallucinated_words": [["elephant", "elephant"], ["elephant", "elephant"], ["bicycle", "bicycle"]], "mscoco_gt_words": ["person", "car", "cow", "bus", "horse"], "hallucination_idxs": [3, 20, 42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6, "Recall": 0.4}}, {"image_id": 348654, "caption": "A black iPhone is placed on a white table, with a black phone stand and a black headset on top of it. The phone stand is elevating the phone, and the headset is connected to the phone. The image shows a well-organized and visually appealing setup, with the phone and head", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "cell phone", "dining table", "tv"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 482432, "caption": "A toothbrush and toothpaste are sitting on a bathroom sink, next to a tube of skin brightening scrub. The toothbrush is clean and ready to be used, while the toothpaste is partially squeezed out of its tube. The skin brightening scr", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "sink", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 454161, "caption": "A delicious pizza is being enjoyed by two people at a table, with a glass of wine nearby. The pizza is topped with various ingredients, including vegetables, meat, and cheese. The scene is cozy and inviting, showcasing the joy of sharing a meal with", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "wine glass", "fork", "pizza"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 144723, "caption": "A small dog is flying through the air with a frisbee in its mouth, showcasing its impressive flying skills and agility.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "frisbee", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 129707, "caption": "A person is holding a cell phone, which is a device used for communication and navigation. The cell phone is connected to a car's audio system, allowing the user to make hands-free calls and listen to music or GPS directions while driving.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["person", "cell phone", "book"], "hallucination_idxs": [25], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 379842, "caption": "A white Nintendo Wii controller and a book are sitting on a table next to a stack of video games, including Super Mario Bros. and Super Mario Bros. 2. The controller is likely being used to play the games, and the book may be a guide or reference for the games.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "remote", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 203110, "caption": "A bright orange streetcar is traveling down a city street, passing by a group of people.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "orange", "car", "truck", "bus", "train"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 556478, "caption": "A caption for the image could be: \"A delicious pizza is being prepared in a kitchen, with two different types of pizza dough on the counter. One is a traditional pizza dough, while the other is a gluten-free pizza dough. The pizza maker is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "cup", "pizza", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 103815, "caption": "A baseball player is pitching a ball while a batter is swinging at the ball in the background. The image captures the moment of action and tension between the pitcher and the batter, showcasing the excitement and intensity of the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 451943, "caption": "A bed or beds are visible in a room, with a lamp and a table nearby. The room is well-lit and has a comfortable atmosphere, making it a cozy and inviting space for relaxation or sleep.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bed", "backpack", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 268854, "caption": "A woman is walking on a beach, carrying a large basket of goods, while a group of boats and a wooden pier are visible in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "handbag", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 34464, "caption": "A group of people, including a man and a woman, are playing in the ocean on a beach. They are holding onto a red kayak, which is floating in the water. The man is wearing a life jacket, and the woman is wearing a swimsuit. They are enjoying their", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 495513, "caption": "A man and a woman are holding hot dogs and grilling them over a fire. They are both smiling and enjoying the outdoor activity together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 529256, "caption": "A brown dog and a white dog are laying on a red bed, possibly in a bedroom or living room. The dogs are close to each other and appear to be sleeping or resting.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 37907, "caption": "A cat sits on a TV stand, looking at a TV screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "cat", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 506401, "caption": "A city street with a traffic light at the intersection, a statue of a wolf, and a group of people walking in the area.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cat", "car", "truck", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 406611, "caption": "A group of people, including skiers and snowboarders, are gathered at the top of a ski slope, enjoying the winter sports and the snowy environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 267225, "caption": "A large truck with a satellite dish on its roof is parked next to a group of cars and a school bus, creating a scene of vehicles and people in a parking lot.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "car", "remote", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 278365, "caption": "A couple is sitting on a patio, enjoying a meal together. They are eating pizza and drinking beer, and there are several pizza boxes on the table. The woman is wearing a blue jacket, and the man is wearing a black shirt. They seem to be", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "cell phone", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 69757, "caption": "A group of people, including a woman and a man, are gathered around a table with a cake and a glass of wine. They are enjoying a celebration, possibly a birthday party or a special occasion. The woman is cutting the cake, while the man is looking on. The scene is captured", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "wine glass", "chair", "cake", "knife", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 432213, "caption": "A delicious sandwich with fries is being enjoyed by a group of people at a restaurant. The sandwich is topped with lettuce, tomato, and cheese, and it is served on a bun. The fries are crispy and golden brown, adding a satisfying side dish to", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "wine glass", "bowl", "knife", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 368367, "caption": "A young woman is sitting at a table, enjoying a meal while using her cell phone.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "cell phone", "cup"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 201555, "caption": "A construction site is shown in the image, with a large dirt road and multiple vehicles present. The road is being dug up, and there are workers in the process of laying down new pipes. The scene is set in a residential area, with a sign indicating the location of a nearby grand national", "mscoco_hallucinated_words": [["worker", "person"]], "mscoco_gt_words": ["traffic light", "truck", "car"], "hallucination_idxs": [29], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 92131, "caption": "A group of people, including a woman and a man, are standing in front of a green bus, possibly waiting for it to arrive or depart. The bus has a large advertisement on the side, which reads \"Hong Kong.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 21779, "caption": "A young woman is lying on the floor, surrounded by luggage and a red backpack. She is smiling and appears to be enjoying the moment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 565148, "caption": "A baseball player is standing at home plate, ready to swing at the ball, while a crowd of people watches from the stands.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 160183, "caption": "A fire truck is parked in front of a building, with a ladder extended from the side of the vehicle. The truck is surrounded by people, and there are several firefighters standing around the truck. The scene suggests that the firefighters are preparing for a firefight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 555456, "caption": "A group of people, including a man in a black jacket, are skiing down a snowy slope. They are all wearing ski gear and appear to be enjoying the winter sport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 235595, "caption": "A group of motorcycles is parked in a parking lot, with some of them being Harley-Davidson models. The image shows a variety of colors and styles, indicating that the motorcycles belong to different owners or are part of a motorcycle club. The presence of multiple motorcycles", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "potted plant", "parking meter", "motorcycle", "car", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 489909, "caption": "A basket of fresh fruits and vegetables, including oranges, bananas, and cucumbers, is displayed on a table. The fruits and vegetables are arranged in a neat and colorful arrangement, making them visually appealing.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bowl", "banana", "orange"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 501080, "caption": "A pink Christmas cactus is sitting in a white vase, surrounded by a dark background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "vase", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 405183, "caption": "A group of friends are gathered around a table, playing a video game on a Nintendo Wii console. One girl is holding a controller and talking to the others while they play. The scene is filled with laughter and excitement, showcasing the joy and camaraderie that comes with playing video games together", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "tv", "potted plant", "chair", "couch", "book", "remote", "handbag"], "hallucination_idxs": [8], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.125}}, {"image_id": 409138, "caption": "A green city bus is parked on a street, with a large advertisement on the side. The bus is stopped at a red light, and there is a person standing next to it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411840, "caption": "Two women tennis players are walking on a grass tennis court, with one holding a tennis racket and the other holding a tennis ball. They are walking in opposite directions, possibly preparing for a match or practicing their skills.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "chair", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 333712, "caption": "A close-up image of a slice of pizza on a plate, with a fork and knife placed next to it, is shown. The pizza slice is topped with bacon, onions, and mushrooms, and it appears to be a delicious and savory dish.", "mscoco_hallucinated_words": [["fork", "fork"], ["knife", "knife"]], "mscoco_gt_words": ["spoon", "dining table", "pizza"], "hallucination_idxs": [14, 16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 148977, "caption": "A teddy bear is sitting on a table, wearing headphones and listening to music. It is surrounded by a book and a cup of coffee, creating a cozy and relaxing atmosphere.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["dining table", "bottle", "bear", "teddy bear", "book", "keyboard"], "hallucination_idxs": [24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 399058, "caption": "A man rides a dung cart down a road, with a large elephant standing next to the cart.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "orange", "truck", "elephant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 183571, "caption": "A man is standing on a red train car, holding a dog while the train is moving.", "mscoco_hallucinated_words": [["train", "train"], ["car", "car"], ["train", "train"]], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [7, 8, 15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6, "Recall": 0.6666666666666666}}, {"image_id": 325836, "caption": "A vintage motorcycle is displayed on a red carpet, surrounded by people at an event. The motorcycle has a unique design, featuring a black and orange paint job, and is adorned with various accessories, such as a sidecar and a large exhaust pipe. The event likely celebrates the", "mscoco_hallucinated_words": [["orange", "orange"]], "mscoco_gt_words": ["motorcycle", "bicycle", "handbag", "person"], "hallucination_idxs": [28], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 437910, "caption": "A small, cramped bathroom with a toilet and sink is shown in the image. The bathroom is cluttered with various items, including a newspaper and a toilet paper roll. The sink is located in the corner of the room, and there is a toilet in the center", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["toilet", "bottle", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 155885, "caption": "A group of boats and fishing nets are seen floating in the water, with a large number of seagulls flying overhead. The scene is set against a picturesque backdrop of a small town, with boats and buildings visible in the distance.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "person", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 467887, "caption": "A man is sitting in a living room, wearing a red shirt and glasses, and using a laptop computer. He is sitting on a couch and has a cup of coffee next to him.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["laptop", "dining table", "person", "chair", "couch", "mouse"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 174402, "caption": "A man in a blue shirt and white tennis shoes is standing on a tennis court, holding a tennis racket. He is looking down and appears to be preparing to hit a tennis ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 352734, "caption": "A young boy is eating a slice of cake from a plate, with a spoon in his hand.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "spoon", "cake", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 346716, "caption": "A group of vintage red double-decker buses is driving down a city street, creating a colorful and lively scene. The buses are parked on the side of the road, and people are walking around them. The image captures the nostalgic charm of the past, showc", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451144, "caption": "Two men are standing on a snowy mountain, looking out at the vast landscape below. One man is wearing a red jacket, and the other man is wearing a black jacket. They are both holding ski poles and appear to be enjoying the scenic view.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295656, "caption": "A group of people, including a man and a woman, are enjoying a meal together at a restaurant. They are eating pizza and drinking beer, and they seem to be having a good time. The man is holding a slice of pizza in his hand, while the woman is holding a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "clock", "chair", "car", "tie", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 129886, "caption": "A group of people, including a man and a woman, are skiing down a snowy slope. They are using ski lifts to get up the mountain and enjoy the winter sports experience. The image captures the excitement and fun of skiing in the snowy environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 557998, "caption": "A young woman sits at a wooden table, looking at a notebook and a glass of wine. She is surrounded by lush greenery and a wooden fence, creating a serene and natural setting.", "mscoco_hallucinated_words": [["notebook", "laptop"]], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "chair"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 401010, "caption": "A white bed with a white pillow and a white blanket is situated in a room with a window. The room has a mirror and a desk, and there is a lamp on the desk. The bed is in a bedroom, and it appears to be a comfortable and well-lit space.", "mscoco_hallucinated_words": [["desk", "dining table"], ["desk", "dining table"]], "mscoco_gt_words": ["tv", "sink", "chair", "bed"], "hallucination_idxs": [27, 36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 567562, "caption": "A family of three is sitting at a table, enjoying a meal together. The mother and two children are eating pizza and salad, while the father is holding a bottle of soda. The children are smiling and having a good time, while the mother is also enjoying her meal", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "spoon", "chair", "bowl", "book", "broccoli", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.36363636363636365}}, {"image_id": 313928, "caption": "A yellow surfboard sits on the beach next to a table with a white umbrella and a chair, while a yellow beach chair is nearby. The scene is set against a blue ocean backdrop, creating a picturesque and inviting atmosphere.", "mscoco_hallucinated_words": [["umbrella", "umbrella"]], "mscoco_gt_words": ["dining table", "bottle", "wine glass", "chair", "surfboard"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6}}, {"image_id": 490284, "caption": "A black dog is sitting on a couch, resting its head on a person's arm.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 346940, "caption": "A kitchen scene with a stove, a pot, and a frying pan on the stove is filled with steam. The steam is rising from the pots and pans, creating a misty atmosphere in the kitchen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "knife", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 222782, "caption": "A woman walks down a city street, passing by a vintage gas station with a sign that reads \"AMOCO GAS.\" The woman is dressed in a coat and hat, and she appears to be walking in a cold weather. The presence of the gas station suggests that the location is likely in a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 255934, "caption": "A mother elephant and her baby are walking together in a zoo, with the mother leading the way and the baby following closely behind.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "cow", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 278627, "caption": "A group of friends enjoying a meal at a restaurant, with a variety of dishes on their plates, including chicken, fish, and vegetables. They are smiling and having a good time together, making the dining experience a memorable one.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "spoon", "chair", "potted plant", "fork", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 400851, "caption": "A group of people is enjoying a sunny day at the beach, lounging on the sand and sitting on a bench. They are surrounded by a large crowd of people, creating a lively atmosphere. The image captures the joy and relaxation of the beachgoers, who are enjoying", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "chair", "umbrella", "sports ball", "backpack", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 472610, "caption": "A woman is standing in a field with her dog, surrounded by cows and a barn. She is smiling and holding her dog close, enjoying the scenic and peaceful environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "cow"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 78565, "caption": "A group of people, including a man and a woman, are standing on the beach, watching a group of sailboats sailing in the water. The sailboats are in the distance, and the people are enjoying the beautiful day and the activity on the water.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 388237, "caption": "A group of young people are skateboarding on a sidewalk, enjoying their time together and engaging in a fun activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "chair", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 289640, "caption": "A group of people are gathered around a table, enjoying a fun night out. They are playing with a yellow frisbee, which is placed on a table. The image captures the joy and camaraderie of the group as they engage in a casual and entertaining activity together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "wine glass", "frisbee", "chair", "orange", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 122602, "caption": "A caption for the image could be: \"A helpful language and vision assistant is assisting a user with a task using natural language. The assistant is sitting at a desk with a computer, a pair of scissors, and a bottle of glue. The assistant is using the scissors and", "mscoco_hallucinated_words": [["computer", "laptop"]], "mscoco_gt_words": ["dining table", "bottle", "scissors"], "hallucination_idxs": [35], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 24104, "caption": "A man is sitting at a desk with a computer, a monitor, and a keyboard. There is a cup of coffee on the desk, and the man is using a computer to work. The desk is cluttered with various items, such as a printer, a lamp, and a book. The", "mscoco_hallucinated_words": [["man", "person"], ["man", "person"]], "mscoco_gt_words": ["laptop", "dining table", "tv", "book", "bed", "keyboard", "mouse", "cup"], "hallucination_idxs": [1, 30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.18181818181818182, "Recall": 0.75}}, {"image_id": 183709, "caption": "A group of people, including a man and a woman, are standing on a city street, looking at a red light at an intersection. They are waiting for the light to turn green before crossing the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "handbag", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 59710, "caption": "A black refrigerator is sitting on a wooden floor, with its door open and a white towel hanging from the handle. The refrigerator is empty, with the shelves removed, and there is a white towel on the floor next to it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 279407, "caption": "A young boy is standing in a baseball field, wearing a green and yellow baseball uniform, holding a baseball bat. He is likely participating in a baseball game or practice, and is ready to hit the ball.", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["person", "bottle", "bench", "baseball glove", "sports ball"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 314729, "caption": "A vintage black and white photograph shows a man wearing a baseball uniform, holding a baseball bat, and standing in front of a white background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 527497, "caption": "A person is sitting at a desk in a modern office, surrounded by computer monitors and a keyboard. The desk is covered with various computer components, such as a mouse, a keyboard, and a computer monitor. The person is using a computer to work, and there is a phone on the desk as", "mscoco_hallucinated_words": [["person", "person"], ["person", "person"], ["phone", "cell phone"]], "mscoco_gt_words": ["laptop", "dining table", "tv", "keyboard", "mouse"], "hallucination_idxs": [1, 43, 55], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 411564, "caption": "A man is sitting on a chair in a kitchen, looking at his phone while resting his feet on the counter.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "chair", "cell phone", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 320350, "caption": "A man and a woman are walking on a snowy lake with their dogs, enjoying a winter outing. They are holding ski poles and appear to be having a fun time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "skis"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 401857, "caption": "A baseball player is swinging a bat at a baseball, while a pitcher is throwing the ball. The player is on the field, and the pitcher is on the mound. The image captures the action and excitement of a baseball game, where the player is trying to hit the ball and the pitcher", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "baseball bat", "baseball glove", "sports ball", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 285302, "caption": "A young boy is sitting at a dining table, surrounded by various materials and tools. He is wearing a striped pajama shirt and is engaged in a creative activity, possibly making a craft or working on a project. The image captures the boy's concentration and focus on his task,", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "scissors", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 61959, "caption": "A yellow school bus is driving down a city street, passing by a red light at an intersection. The bus is surrounded by a busy city scene, with cars and pedestrians present.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bus", "traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 229659, "caption": "A man is sitting at a table in a restaurant, using a laptop computer while a woman is sitting across from him. They are both looking at the computer screen, possibly discussing something or working together on a project. The laptop is open on the table, and there is a cup of coffee on the table as well", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["laptop", "dining table", "bottle", "person", "tv", "clock", "chair"], "hallucination_idxs": [55], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.42857142857142855}}, {"image_id": 473118, "caption": "A young man is riding a skateboard down a ramp, performing a trick in the air. He is wearing a blue shirt and jeans, and his skateboard is white. The image captures the moment of his jump, showcasing his skill and athleticism.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 391222, "caption": "A man and a woman are standing on a snowy hillside, looking at a map or a sign. They are likely outdoor enthusiasts, as they are dressed in winter clothing and carrying backpacks. The man is wearing a black jacket, and the woman is wearing a purple", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 416104, "caption": "A group of people are sitting at a table outside, enjoying their drinks and conversation under a blue umbrella.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "chair", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 511852, "caption": "A man and a woman are skiing down a snowy slope, enjoying the winter sports experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 59386, "caption": "A group of giraffes are gathered around a tree, with one giraffe eating leaves from the tree while the others stand nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["giraffe", "zebra", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 540180, "caption": "A green traffic light is mounted on a pole in the middle of a street, with cars passing by in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 153692, "caption": "A man rides a bicycle across a street, with a dog by his side, while navigating through a busy intersection.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "backpack", "dog", "car", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 265628, "caption": "A man is standing in front of a toilet in a bathroom, looking at his phone. The toilet is located in a small room with a wooden door, and there is a sink nearby. The man is likely using his phone to check his email or browse the internet while he is in the", "mscoco_hallucinated_words": [["phone", "cell phone"], ["sink", "sink"], ["phone", "cell phone"]], "mscoco_gt_words": ["bowl", "toilet", "person"], "hallucination_idxs": [16, 35, 44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.42857142857142855, "Recall": 0.6666666666666666}}, {"image_id": 499594, "caption": "A white plate is filled with a delicious dish of grilled steak, broccoli, and carrots, accompanied by a side of pasta. The dish is served on a blue tablecloth, adding a touch of elegance to the meal. The combination of flavors and text", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["dining table", "bottle", "knife", "broccoli", "fork", "cup"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.16666666666666666}}, {"image_id": 5934, "caption": "A baseball glove is sitting on a bench, with a baseball inside it. The glove is brown and has a white logo on it. The baseball is a white baseball with an American flag on it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["sports ball", "baseball glove", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47828, "caption": "A bright blue bridge illuminated at night, with a boat floating in the water below, creates a stunning and serene scene. The bridge's blue lighting adds a touch of elegance and beauty to the nighttime landscape, while the boat's presence adds a sense of movement and activity to the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47916, "caption": "A group of dogs, including a white dog and a brown dog, are playing in a grassy field, chasing each other and running around.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bench", "frisbee", "dog", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 255483, "caption": "A man is sitting at a desk with a pile of papers and a pen, possibly working on an article or writing a letter. He is surrounded by various documents and appears to be in the process of writing or reading.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "scissors", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 131138, "caption": "A man is sitting at a desk with a computer, a monitor, and a keyboard. There is a coffee cup on the desk, and a whiteboard is visible in the background. The man is likely working on a project or using the computer for personal or professional purposes.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "spoon", "person", "dining table", "tv", "potted plant", "keyboard", "mouse", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 258209, "caption": "A man sits on a bench in front of a brick wall, looking at his phone.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "bicycle", "book", "bench"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 347453, "caption": "A city street is filled with red double-decker buses, creating a bustling and vibrant atmosphere. The buses are parked along the side of the road, and some of them have passengers on board. The image captures the hustle and bustle of city life, show", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "car", "bus", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 285820, "caption": "A living room with a large window, a couch, and a TV is shown in the image. The room is well-lit and has a comfortable atmosphere, making it a great space for relaxation and entertainment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "tv", "bench", "bowl", "couch", "cell phone", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 245664, "caption": "A man is sitting at a desk with a computer, a laptop, and a glass of wine. There is a window behind him, and a television is visible in the background. The man is likely working or relaxing in his office, enjoying a drink while using his computer or laptop.", "mscoco_hallucinated_words": [["man", "person"], ["man", "person"]], "mscoco_gt_words": ["laptop", "dining table", "tv", "wine glass", "book", "keyboard", "mouse", "cup"], "hallucination_idxs": [1, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.375}}, {"image_id": 453731, "caption": "A dog is laying on a wooden table, surrounded by various items such as a barrel, a bottle, and a wooden crate. The dog is likely enjoying the warmth and comfort of the wooden surface, and the presence of the items may provide it with a sense of security or familiarity.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bottle", "dog", "cup"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 524601, "caption": "A group of friends is gathered around a couch, playing a video game together. They are all holding Nintendo Wii controllers and are engaged in a fun and competitive gaming session. The image captures the excitement and camaraderie of the group as they enjoy their time together playing the game.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "couch", "book", "refrigerator", "remote"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 253262, "caption": "A group of people are standing near a parked airplane, possibly waiting for it to take off or having just arrived at the airport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tie", "truck", "airplane", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 87052, "caption": "A couple is standing in a kitchen, looking at a refrigerator. They are likely discussing or preparing food for a meal. The man is wearing a black shirt and the woman is wearing a green shirt. They are both standing in front of the refrigerator, which", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "oven", "bowl", "refrigerator", "vase", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 357578, "caption": "A fire truck is parked on a city street, with a car parked next to it. The fire truck is red and has a ladder on its side, while the car is white and has a bumper sticker on its rear window.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 418692, "caption": "A couple is sitting on a couch in a living room, reading books and enjoying their time together. The room is well-lit, and there is a lamp on the coffee table. The couple is comfortable and relaxed, engaging in a leisurely activity.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "chair", "couch", "cell phone", "book", "remote"], "hallucination_idxs": [33], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 259345, "caption": "A man with a beard and a pink umbrella is sitting on a bench, smiling and enjoying the sunshine.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "umbrella", "chair"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 119709, "caption": "A woman is preparing a batch of donuts on a kitchen counter, carefully arranging them on a tray. She is wearing a red apron and has a pair of sunglasses on, adding a touch of style to her outfit. The woman is likely making the donuts for a special", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "donut"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 443299, "caption": "A young couple is sitting on a bench in a train station, both using their smartphones. They are in a busy and crowded environment, but they are engrossed in their personal devices, oblivious to their surroundings.", "mscoco_hallucinated_words": [["train", "train"]], "mscoco_gt_words": ["person", "bench", "cell phone", "handbag", "backpack"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.4}}, {"image_id": 120776, "caption": "A group of people is gathered around a large metal sculpture in a city setting, possibly in front of a restaurant or a park. The sculpture is made up of several interconnected metal pieces, creating a unique and eye-catching design. The people are enjoying their time together, possibly discussing the art", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tie", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 411765, "caption": "A young man is playing tennis on a court, using a tennis racket to hit a tennis ball back and forth with another player. The image captures the moment when the man is swinging his racket to hit the ball, with the ball flying through the air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 447991, "caption": "A group of people, including a young woman, are walking down a city street, passing by a vintage Volkswagen bus parked on the sidewalk. The scene is set at night, with the city lights illuminating the surrounding buildings and the street. The woman is wearing a blue shirt and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "cell phone", "car", "handbag", "truck", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 276719, "caption": "A group of people, including a man and a woman, are standing in front of a row of cars, which are parked on a street. The cars are mostly old and vintage, and there is a dog walking around the area. The scene is likely a car show or a gathering of car enthus", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "motorcycle", "dog", "car", "handbag", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 422328, "caption": "A horse is standing in the snow, pulling a sled with a pile of hay on it. The horse is wearing a harness and is likely being used for transportation or work in the snowy environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car", "snowboard", "horse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 354559, "caption": "A young woman is posing for a photo, holding a stuffed animal and wearing a black and white striped outfit. She is smiling and looking directly at the camera, creating a playful and fun atmosphere in the image.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bear", "teddy bear"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 438788, "caption": "A group of people are gathered around a table, enjoying a delicious cake. The cake is a white chocolate cake with chocolate chips and a layer of frosting on top. The people are smiling and taking bites of the cake, indicating that they are enjo", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cake", "dining table", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 468005, "caption": "A large, brown elephant is standing on a wooden platform, with its trunk raised and its tusks visible. It is standing in front of a green fence, and there are people nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 545594, "caption": "A man is standing on a city bus, holding a backpack and wearing a colorful shirt. He is surrounded by other passengers, who are seated on the bus. The man is looking down at his phone, possibly checking his location or a message. The image captures the daily commute of people", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "orange", "backpack", "chair"], "hallucination_idxs": [39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.5}}, {"image_id": 219546, "caption": "A Christmas dinner table is filled with various dishes, including a ham, a turkey, and a roast beef. The table is set with a red and white tablecloth, and there are multiple forks, knives, and spoons on the table. The scene is festive and inviting", "mscoco_hallucinated_words": [["turkey", "bird"]], "mscoco_gt_words": ["spoon", "dining table", "bottle", "chair", "bowl", "knife", "fork"], "hallucination_idxs": [15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.5714285714285714}}, {"image_id": 386645, "caption": "A dilapidated building with a sign that reads \"Chinatown\" is shown in the image. The building appears to be in a state of disrepair, with broken windows and a crumbling facade. The image captures the essence of a once-thriving business district that", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "person", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 155131, "caption": "A woman is playing tennis on a grassy court, with a tennis racket in her hand. She is wearing a white tennis outfit and is in the process of hitting a tennis ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "tie", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 188752, "caption": "A man is standing in front of a fruit stand, surrounded by various fruits, including bananas and apples. He is looking at a banana hanging from a string, and the fruit stand is filled with other fruits and vegetables.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "banana", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 228350, "caption": "A group of people are gathered around a table in a restaurant, enjoying a meal together. The restaurant has a casual atmosphere, with a red umbrella and a white tablecloth. The people are dressed in formal attire, adding to the elegance of the setting.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "wine glass", "chair", "bowl", "umbrella", "tie", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 437720, "caption": "A woman is sitting at a desk, typing on a typewriter while wearing a red dress. She is surrounded by a red chair and a rug, and there is a vase of flowers on the desk. The woman is working on a piece of writing, possibly a letter or a story, and is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "person", "chair", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 378831, "caption": "A woman is walking down a street, carrying a large bag of groceries. She is wearing a green shirt and a red hat, and is walking past a fire hydrant.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "fire hydrant", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375503, "caption": "A staircase with a wooden banister and a clock is located in a room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "tv", "person", "clock", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 330369, "caption": "A red fishing boat is docked at a pier, with a man standing on the pier and a woman standing on the boat. The boat is surrounded by water, and there is a large fishing net on the boat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "person", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 288576, "caption": "A man is playing with a frisbee in a park, throwing it up in the air and catching it with his hands. The man is wearing a hat and is surrounded by a group of children playing on a playground.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 32190, "caption": "A small horse figurine stands on the sidewalk in front of a building, looking out at the street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "horse", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 535403, "caption": "A woman is standing in front of a sink, with a toothbrush and a hair dryer on the counter. There is a mirror above the sink, and a hair dryer is also on the counter. The sink is clean and has a toothbrush on it.", "mscoco_hallucinated_words": [["woman", "person"], ["toothbrush", "toothbrush"], ["toothbrush", "toothbrush"]], "mscoco_gt_words": ["clock", "bottle", "potted plant", "toilet", "hair drier", "sink"], "hallucination_idxs": [1, 12, 46], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.16666666666666666}}, {"image_id": 449798, "caption": "A desk with a computer, mouse, and keyboard is surrounded by various toys and figurines, creating a unique and playful workspace.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "cell phone", "book", "keyboard", "mouse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 375769, "caption": "A young boy is sitting at a table, eating a sandwich while looking at a bicycle parked outside.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["person", "dining table", "bicycle", "chair", "umbrella", "hot dog", "car", "cup"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.375}}, {"image_id": 426172, "caption": "A colorful and inviting wine bar is showcased in the image, featuring a variety of wine bottles, wine glasses, and other wine-related items. The wine bar is set up in a cozy and welcoming atmosphere, with a table and chairs for guests to enjoy their wine. The", "mscoco_hallucinated_words": [["wine glass", "wine glass"]], "mscoco_gt_words": ["dining table", "bottle", "chair", "knife", "book"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 20650, "caption": "A sandwich with broccoli, cheese, and a side of fries is being enjoyed on a plate.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "orange", "sandwich", "broccoli", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 138078, "caption": "A young baseball player stands on the field, wearing a red baseball uniform and holding a baseball bat. He is looking up at the sky, possibly waiting for a pitch or contemplating his next move. The image captures the player's determination and focus on the game, as he prepares to make", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 152499, "caption": "A group of people, including children and adults, are gathered around a swimming pool, enjoying a fun day together. They are playing with a variety of pool toys, including a beach ball, a pool noodle, and a water gun. The scene is filled with laughter and joy, capt", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "dining table", "potted plant", "chair", "umbrella", "surfboard"], "hallucination_idxs": [36], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.16666666666666666}}, {"image_id": 180764, "caption": "A man is sitting on a couch, eating a doughnut while looking at his phone.", "mscoco_hallucinated_words": [["couch", "couch"], ["phone", "cell phone"]], "mscoco_gt_words": ["person", "microwave", "bottle", "donut"], "hallucination_idxs": [6, 15], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.5}}, {"image_id": 147762, "caption": "A delicious dessert is served on a white plate, consisting of a chocolate cake with a scoop of ice cream on top. The cake is decorated with a small pile of chopped nuts, adding a crunchy texture and a touch of flavor to the dessert", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "dining table", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 113860, "caption": "A black and white boat is floating on the water, surrounded by trees and a green landscape.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "boat"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 460866, "caption": "A toothbrush and toothpaste are sitting on a bathroom counter, with a toothbrush holder and a tube of toothpaste next to them.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bowl", "toothbrush", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 177015, "caption": "A man is sitting on a couch, using a laptop computer while a cat is sitting on his lap.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "person", "apple", "chair", "couch", "cat", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5714285714285714}}, {"image_id": 333998, "caption": "A kitchen with a refrigerator, stove, and sink is shown in the image. There is a dishwasher in the corner, and a countertop with a sink and a faucet. The kitchen is clean and well-organized, with a few dishes on the counter.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "oven", "bowl", "refrigerator", "microwave", "sink", "cup", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 47131, "caption": "A group of men are gathered around a train wreck, with one man standing on the train and another man standing on the ground. The train is in disarray, with its wheels and cars scattered across the ground. The men are likely trying to assess the damage and determine the best course of action to take in", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425447, "caption": "A white pickup truck is parked on a street, with a man standing next to it. The truck has a hose attached to its side, and the man is holding a nozzle. The scene suggests that the man is using the hose to clean the truck, possibly washing it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "fire hydrant", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 295105, "caption": "A man is standing in a kitchen, looking at a refrigerator while holding a bag of groceries. He is wearing a black shirt and jeans, and appears to be preparing to cook or prepare food. The image captures a moment of the man's daily routine, as he", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "apple", "bottle", "oven", "bowl", "refrigerator", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 443259, "caption": "A modern kitchen with white cabinets, a stainless steel countertop, and a large island serves as the focal point of the room. The kitchen features a large, open layout, allowing for easy movement and interaction between the various elements. The presence of a dining table and a large bowl of fruit", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "bottle", "oven", "potted plant", "chair", "bowl", "orange", "refrigerator", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 537861, "caption": "A train is traveling down the tracks, with a passenger train car in the foreground. The train car has a yellow and blue color scheme, and it is pulling a passenger train car behind it. The image shows the train car's front end, with a large window and a small door on the side.", "mscoco_hallucinated_words": [["car", "car"], ["car", "car"], ["car", "car"], ["car", "car"]], "mscoco_gt_words": ["person", "train", "bench"], "hallucination_idxs": [12, 19, 35, 44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4444444444444444, "Recall": 0.3333333333333333}}, {"image_id": 145020, "caption": "A Disney character, possibly Mickey Mouse, is standing in front of a Christmas tree at Disneyland. The character is dressed in a festive outfit and holding a sign that reads \"Merry Christmas.\" The image captures the holiday spirit and joyful atmosphere of the park during the Christmas season.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "mouse", "teddy bear", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 249969, "caption": "A delicious and festive holiday meal is presented on a white plate, featuring a variety of dishes, including a roasted chicken, mashed potatoes, and vegetables. The meal is accompanied by a side of cranberry sauce and a glass of wine. The arrangement of the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "dining table", "bird", "wine glass", "knife", "broccoli", "fork", "carrot"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 146504, "caption": "A man is sitting at a desk, using a computer mouse to navigate through a computer program. He is wearing a white shirt and a tie, and there is a cup of coffee on the desk next to him. The image captures a moment of concentration and focus as the man works on his computer", "mscoco_hallucinated_words": [["tie", "tie"]], "mscoco_gt_words": ["laptop", "dining table", "person", "keyboard", "mouse", "cup"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1, "Recall": 0.8333333333333334}}, {"image_id": 40037, "caption": "A tall clock tower stands in front of a building, with a large clock face visible on the tower. The clock is set to 12:30, and the building appears to be a historic structure. The image captures the essence of a bustling city street, with a car parked nearby", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 343218, "caption": "A young man is playing tennis on a court, using a tennis racket and a tennis ball. He is standing in front of a net, preparing to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 301837, "caption": "A modern kitchen with white cabinets and countertops features a stainless steel refrigerator, a dishwasher, and a microwave. The kitchen also includes a sink, a stove, and a large window that allows natural light to enter the space. The overall design of the", "mscoco_hallucinated_words": [["microwave", "microwave"]], "mscoco_gt_words": ["apple", "clock", "oven", "refrigerator", "sink"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 309071, "caption": "A man is seen standing next to a parked bicycle, possibly preparing to ride it. He is wearing a blue shirt and a pair of shorts, and he has a helmet on his head. The man is also holding a bike lock in his hand, which suggests that he is", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "bench", "potted plant", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 240681, "caption": "A young man is standing next to a red motorcycle, looking at his phone while wearing a backpack. The motorcycle is parked on the side of a road, and the man is standing in front of it, possibly waiting for someone or checking his phone for directions. The image captures a moment of", "mscoco_hallucinated_words": [["phone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["motorcycle", "backpack", "person", "car"], "hallucination_idxs": [14, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2857142857142857, "Recall": 0.75}}, {"image_id": 178753, "caption": "A young girl is sitting in a red chair, smiling and looking at her phone. She is in a sports arena, possibly waiting for a game or event to begin.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 278890, "caption": "A man is using his cell phone while standing in a store, possibly looking at a product or browsing online. He is holding the phone in his hand and appears to be engaged in a conversation with someone else, possibly a friend or a salesperson. The image captures a moment of interaction between the man and the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "dining table", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 47781, "caption": "A modern bedroom with a red bed and a black nightstand is shown in the image. The room features a large window, a lamp, and a mirror, creating a cozy and inviting atmosphere.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "book", "bed", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 542792, "caption": "A large baseball bat stands in front of a building, with a baseball field visible in the background. The bat is a symbol of the sport and the city's connection to it. The presence of the bat and the baseball field suggests that the city is home to a baseball team or has a strong interest in the sport", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 293703, "caption": "A group of three men are sitting at a table, enjoying their meals. They are having a conversation while eating their pizza and salads. The atmosphere is casual and relaxed, with the men dressed in casual attire.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "chair", "bowl", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 318777, "caption": "A group of baseball players is standing on the field, ready to play a game. They are wearing their respective team's uniforms and are positioned on the field, waiting for the game to begin. The image captures the excitement and anticipation of the players as they prepare to compete against each other", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "baseball glove", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 14773, "caption": "A colorful car-shaped sandwich sits on a plate, surrounded by french fries and a hamburger. The sandwich is placed on top of a car-shaped plate, which adds a playful touch to the meal. The combination of the car-shaped sandwich,", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["hamburger", "sandwich"], ["sandwich", "sandwich"], ["sandwich", "sandwich"]], "mscoco_gt_words": ["spoon", "dining table", "person", "bottle", "hot dog", "car", "fork", "cup"], "hallucination_idxs": [3, 15, 18, 42], "metrics": {"CHAIRs": 1, "CHAIRi": 1.0, "Recall": 0.0}}, {"image_id": 521863, "caption": "A man is skateboarding on a sidewalk in front of a building, with people walking by and a bicycle parked nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 250540, "caption": "A group of men riding motorcycles, including one man wearing a helmet, are parked on the side of a street. They are all dressed in casual attire and appear to be enjoying their time together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "cell phone", "car", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 211604, "caption": "A young woman is lying on a wooden deck, wearing a tennis outfit and a hat, and is resting her head on her hand. She is likely taking a break from playing tennis or enjoying the sunny weather.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 298067, "caption": "A plate of grilled meat and a beer are sitting on a table, with a close-up of the meat and a bottle of beer in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "bottle", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 563938, "caption": "A group of friends are sitting on a couch, looking at a tablet or a phone. They are engaged in a conversation, possibly discussing a topic or sharing a funny story. The scene is casual and relaxed, with the friends enjoying each other's company.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "bottle", "bench", "couch", "tie"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 461311, "caption": "A group of people, including children and adults, are gathered in a park, enjoying a fun day out. They are flying kites in the open sky, with the wind gently lifting the colorful and decorated kites. The scene is filled with laughter and joy, as people of all", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "kite", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 47940, "caption": "A young man is lying on a bed, surrounded by books and a stuffed animal. He is reading a book and has a stuffed animal sitting next to him. The image captures a moment of relaxation and leisure, where the young man is engaging in a quiet activity, enjoying his time", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "book", "person", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 261318, "caption": "A man is sitting on a red chair, using his cell phone while waiting for his luggage at the airport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "chair", "cell phone", "handbag", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 134768, "caption": "A black computer mouse is sitting on a desk next to a pair of speakers, with a keyboard nearby. The speakers are turned on, and there is a black cable connected to them. The image captures a moment of a person using their computer, possibly listening to music or working on a project. The", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["laptop", "keyboard", "dining table", "mouse"], "hallucination_idxs": [44], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 1.0}}, {"image_id": 526414, "caption": "A woman is sitting at a desk in a room filled with various items, including a sewing machine, a TV, and a bookshelf. She is surrounded by books and other materials, and there is a window behind her. The image captures a moment of her working on a sewing project, possibly", "mscoco_hallucinated_words": [["woman", "person"]], "mscoco_gt_words": ["laptop", "dining table", "tv", "bowl", "couch", "cat", "scissors", "book", "remote", "cup"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3}}, {"image_id": 273132, "caption": "An elderly woman sits on a bench, surrounded by her belongings, and enjoys the sunshine while waiting for her bus.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 505213, "caption": "A man is eating a hot dog in a park, enjoying the winter weather.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 192656, "caption": "A baseball player is standing on a grass field, wearing a black and white uniform, and holding a baseball bat. He is in the middle of a pitch, ready to swing and hit the ball. The image captures the player's determination and focus on the game, as he prepares to make contact", "mscoco_hallucinated_words": [["baseball bat", "baseball bat"]], "mscoco_gt_words": ["person", "sports ball", "baseball glove"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 272728, "caption": "A vase filled with colorful flowers sits on a table, surrounded by a green rug and a wooden chair. The flowers are arranged in a beautiful and artistic manner, adding a touch of elegance and beauty to the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "chair", "vase", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 509811, "caption": "A group of students are sitting at tables in a library, using their laptops and working on their assignments. The room is filled with computers and tables, creating a modern and functional learning environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "apple", "person", "chair", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 412407, "caption": "A woman is holding a cell phone and talking to someone, possibly a friend or family member, while sitting on a couch. She is using the phone to communicate with the person on the other end of the call.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["cell phone", "clock", "person"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 353658, "caption": "A woman is walking down a street in a city, carrying an umbrella to protect herself from the rain. She is surrounded by people shopping at a market, and there are various items on display, such as fruits and vegetables. The scene captures the hustle and bustle of city", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "umbrella", "handbag", "carrot", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 441363, "caption": "A man in red shorts and a white shirt is playing tennis on a court, with a tennis racket in hand. He is swinging the racket and preparing to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 331084, "caption": "A group of people are preparing a meal on a table, with various ingredients and utensils laid out. They are chopping vegetables, slicing meat, and arranging ingredients on a cutting board. The scene suggests that they are preparing a meal together, possibly for", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "person", "dining table", "bowl", "knife", "carrot", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 282553, "caption": "A man and a woman are walking down a dirt path in a grassy field, with a large stone monument in the background. The couple is likely enjoying a leisurely stroll or a scenic walk, taking in the natural beauty of the area. The presence of the stone monument adds an interesting", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 328818, "caption": "A young woman is sitting on a bench, putting on her shoes while holding a bicycle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "bottle", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 3103, "caption": "A man in a yellow helmet and black pants is performing a trick on a skateboard, flying through the air while riding down a ramp.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 188136, "caption": "A large, green kitchen with a stainless steel sink and a variety of pots and pans is filled with fresh fruits and vegetables. The kitchen is well-equipped with utensils and appliances, and there are several bowls and containers on the countertop. The scene suggests that", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bowl", "orange", "carrot", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 449675, "caption": "A white plate with a sandwich on it sits on a table, surrounded by a glass of water and a fork. The sandwich is made of meat and vegetables, and it appears to be a delicious and satisfying meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "dining table", "bottle", "knife", "sandwich", "fork", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.375}}, {"image_id": 191691, "caption": "A man is shaving in a bathroom, using a razor to remove his facial hair. He is standing in front of a sink, with a towel on the counter and a toothbrush on the sink. The man is wearing a bathrobe, and his face is covered in sh", "mscoco_hallucinated_words": [["sink", "sink"], ["sink", "sink"]], "mscoco_gt_words": ["person", "bottle", "toothbrush"], "hallucination_idxs": [24, 37], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.6666666666666666}}, {"image_id": 89378, "caption": "A man is standing next to a red motorcycle, wearing a black helmet and a black jacket. He is holding a black helmet in his hand, and the motorcycle is parked on the side of a road.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "backpack", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 99874, "caption": "A young woman is sitting at a table, wearing sunglasses and holding a cell phone. She is likely waiting for someone or taking a break from her activities.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "cell phone", "cat", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 437895, "caption": "A colorful bed with a hanging bed frame and a bedspread is shown in the image. The bed is adorned with a variety of patterns and colors, creating a visually appealing and unique design.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["vase", "potted plant", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 557447, "caption": "A man in a suit and tie is sitting at a desk in a conference room, looking at a piece of paper. He is likely discussing or reviewing a document or presentation, possibly related to a business meeting or conference. The man is engaged in a thoughtful and focused conversation, using his pen to highlight", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "spoon", "knife", "tie", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 159979, "caption": "A group of people are gathered on a boat, enjoying a meal together. The boat is filled with various food items, including bowls, plates, and cups, and there are umbrellas overhead to provide shade. The scene suggests a casual and relaxed atmosphere, where people can", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["bowl", "umbrella", "person", "boat"], "hallucination_idxs": [30], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 1.0}}, {"image_id": 357, "caption": "A baseball game is taking place on a green field, with a player standing on the base and another player in the process of throwing the ball.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "baseball bat", "baseball glove"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 538891, "caption": "A young woman is standing on a tennis court, holding a tennis racket and looking at the camera. She is wearing a white tennis shirt and shorts, and her hair is tied back. She is ready to serve the ball, and her focus is on the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 561967, "caption": "A train is traveling down a railroad track, passing by a group of railroad cars.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 565778, "caption": "A blue train is traveling down a track, passing through a tunnel, and crossing a bridge. The train is carrying passengers, and it is lit up by the headlights of the engine.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 7125, "caption": "A group of people, including a man and a woman, are riding bicycles along a path near a river. They are enjoying the scenic view and the fresh air while engaging in a leisurely activity.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "bottle", "dog", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 221350, "caption": "A man is holding a red tie with a heart-shaped pattern, which is a unique and eye-catching accessory.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "tie", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 280930, "caption": "A young girl is standing in front of a kitchen counter, holding a tray of freshly baked cookies. She is smiling and looking at the camera, capturing a moment of joy and satisfaction with her delicious treat.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "oven", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 151081, "caption": "A small airplane is flying over a field, with a fence and a road in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "airplane", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 122232, "caption": "A woman is playing tennis on a grassy field, with a tennis racket in her hand and a ball on the ground. She is standing in front of a white net, and there are several tennis balls scattered around her.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 134223, "caption": "A plate of food, including a sandwich, fries, and a salad, is placed on a white table. The sandwich is a hot dog, and it is accompanied by a side of fries and a salad. The plate is set up on a table with a white tablecloth, and", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["sandwich", "sandwich"]], "mscoco_gt_words": ["bowl", "dining table", "hot dog", "broccoli"], "hallucination_idxs": [7, 23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.5}}, {"image_id": 198163, "caption": "A man is sitting at a table, surrounded by various colorful ceramic pieces, including bowls, plates, and cups. He is engaged in painting or decorating the ceramics, using a brush and paint to add color and designs to the items. The man is likely an artist or", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["bowl", "dining table", "person"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 3742, "caption": "A bowl of fresh apples sits on a table next to a window, with a vase of red roses nearby. The apples are arranged in a neat and colorful pattern, adding a touch of elegance to the scene. The presence of the roses adds a romantic and inviting atmosphere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "apple", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 217593, "caption": "A young boy is standing in a field, wearing a baseball uniform and holding a baseball bat. He is ready to swing and hit the ball, as he is surrounded by other people, including a woman and a man, who are watching him. The image captures the excitement and anticipation of the young boy as", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "chair", "baseball bat", "baseball glove", "handbag"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.4}}, {"image_id": 279078, "caption": "A young girl is standing in front of a refrigerator filled with various bottles of beer. She is holding a bottle of beer and looking at the refrigerator, possibly admiring the selection of beverages.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 572081, "caption": "A man is playing tennis on a court, with a net in the middle. He is wearing a tennis outfit and holding a tennis racket. The image shows the tennis court in a stadium setting, with a large crowd watching the match.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "couch", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 477016, "caption": "A young girl and her mother are standing in front of a colorful kitchen, looking at a large aquarium filled with fish. The mother is holding a baby, and the girl is holding a toy. The scene is likely a family moment, where they are enjoying each other's company and the unique aqu", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "oven", "potted plant", "handbag", "sink", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 301266, "caption": "A group of young people are gathered around a table, with various items on it. They are engaged in a cooking activity, possibly a cooking class or a group project, where they are learning to prepare and cook food together. The image captures the excitement and camaraderie of the group as they work", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "spoon", "book", "fork", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 475813, "caption": "A young girl is standing in front of a table, holding a toy phone and looking at the camera.", "mscoco_hallucinated_words": [["table", "dining table"], ["phone", "cell phone"]], "mscoco_gt_words": ["person", "remote", "handbag"], "hallucination_idxs": [9, 14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 558784, "caption": "A man is standing on a grassy field, holding a golf club and looking at a lake in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "frisbee", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 308543, "caption": "A man is holding two silver spoons in his hand, with one spoon resting on the edge of a sink. The image captures a moment of the man preparing to wash the spoons in the sink.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "sink", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 359164, "caption": "Two dogs, a small brown one and a larger white one, are playing in a grassy area. The brown dog is running around, while the white dog is chasing it. They appear to be having fun and enjoying each other's company.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "dog", "chair", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 539951, "caption": "A small kitchen with a white and gray color scheme is showcased in the image. The kitchen features a stove, a sink, and a refrigerator, all made from Lego bricks. The kitchen is designed to look like a miniature version of a real kitchen, complete with a checkered", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "sink", "oven", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 143479, "caption": "An elderly man is holding a tray of hot dogs, and a woman is standing next to him. They are both outside, possibly at a picnic or barbecue, and the man is handing the tray to the woman. The woman is smiling and appears to be enjoying the hot dogs", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "hot dog", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 475024, "caption": "A vase filled with colorful flowers sits on a table, adding a touch of beauty and warmth to the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "orange", "vase", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 238065, "caption": "A young man is riding a skateboard on a wooden ramp, performing a trick in the air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "chair", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 314016, "caption": "A small bathroom is filled with various items, including a toilet, a sink, a mirror, and a bottle of alcohol. The sink is covered with a towel, and there is a note on the mirror. The bathroom is clean and well-organized, with a toilet", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["toilet", "bottle", "sink", "book"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 322163, "caption": "A group of people, including a chef and several others, are gathered around a kitchen counter, preparing food. They are using various kitchen tools and utensils to prepare the meal, which includes a pizza. The chef is using a pizza cutter to slice the pizza, while others are using", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "oven", "potted plant", "bowl", "microwave", "remote", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 230983, "caption": "A young man is performing a skateboard trick on a sidewalk, jumping over a green plastic barrel. The man is wearing a black shirt and jeans, and he is in the middle of a street. The image captures the excitement and skill of the skateboarder as he", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skateboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 564629, "caption": "A large kitchen with a stove, oven, and refrigerator is visible in the image. The kitchen is located in a motorhome, which is parked in a parking lot. The motorhome has a large window, allowing natural light to enter the kitchen. The kitchen is well-equipped", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["microwave", "sink", "oven", "refrigerator"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 53431, "caption": "A man is sitting on a chair, using a laptop while wearing a blue shirt, a tie, and a hat. He is sitting in front of a brick wall, and there is a small table next to him.", "mscoco_hallucinated_words": [["tie", "tie"], ["table", "dining table"]], "mscoco_gt_words": ["laptop", "person", "chair"], "hallucination_idxs": [18, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 1.0}}, {"image_id": 441840, "caption": "A young boy is playing baseball in a field, swinging a bat and trying to hit a ball. He is surrounded by other kids and adults, who are watching and cheering him on. The image captures the excitement and energy of a fun day at the ballpark, where children can engage in", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "car", "baseball bat", "baseball glove", "truck"], "hallucination_idxs": [18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.2}}, {"image_id": 53465, "caption": "A group of people is gathered around a table, enjoying a delicious cake. The cake is decorated with the words \"Welcome to the Jungle\" and has a pink and white color scheme. The people are smiling and having a good time, indicating that they are celebrating a special", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "dining table", "person", "bowl", "cake", "fork", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 381031, "caption": "A bowl of peanut butter and jelly sandwiches, a glass of orange juice, and a jar of peanut butter are arranged on a table.", "mscoco_hallucinated_words": [["bowl", "bowl"], ["sandwich", "sandwich"], ["orange", "orange"]], "mscoco_gt_words": ["spoon", "dining table", "bottle", "apple", "donut", "microwave", "cup"], "hallucination_idxs": [1, 7, 12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.75, "Recall": 0.14285714285714285}}, {"image_id": 530520, "caption": "Two men are sitting on a grassy lawn, using their laptops and discussing something.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "clock", "person", "motorcycle", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 539555, "caption": "A young man is performing a trick on a skateboard, jumping and spinning in the air while wearing a white t-shirt and a pair of red sneakers.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "frisbee", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 279521, "caption": "Two men are standing next to a city bus, looking at it. One man is wearing a hat, and the other man is wearing a jacket. They are likely waiting for the bus to arrive or discussing their plans. The image captures a moment of casual conversation between the two men, as", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "handbag", "bus", "train", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 560439, "caption": "A group of people, including a man and a woman, are walking down a snowy slope, possibly on a ski trail. They are wearing winter clothing and carrying skis, indicating that they are participating in winter sports. The image captures the joy and excitement of the group as they enjoy their time", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "handbag", "snowboard", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 248353, "caption": "A group of people, including a man and a woman, are skiing down a snowy hill. They are all wearing ski gear and appear to be enjoying their time on the slopes.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 9628, "caption": "A man is riding a jet ski while performing a trick in the water, with a red kite flying in the background.", "mscoco_hallucinated_words": [["jet", "airplane"], ["ski", "skis"], ["kite", "kite"]], "mscoco_gt_words": ["person", "surfboard", "boat"], "hallucination_idxs": [5, 6, 18], "metrics": {"CHAIRs": 1, "CHAIRi": 0.75, "Recall": 0.3333333333333333}}, {"image_id": 330050, "caption": "A man and a woman are playing tennis on a court, with the man holding a tennis racket and the woman holding a tennis racket and a tennis ball. They are standing in front of a net, and the woman is smiling while the man is looking at her.", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "tennis racket", "bench"], "hallucination_idxs": [29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.6666666666666666}}, {"image_id": 254161, "caption": "A man is standing in the middle of a city square, surrounded by tall buildings and a large flag. He is holding a smartphone and appears to be taking a photo of the scene. The city square is filled with people, and the man is capturing the moment with his phone.", "mscoco_hallucinated_words": [["smartphone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["kite", "handbag", "person"], "hallucination_idxs": [25, 54], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.3333333333333333}}, {"image_id": 275749, "caption": "A group of friends are gathered around a computer screen in a room, possibly a living room or a study area. They are watching a video or playing a game together, with one person sitting in front of the computer and others standing around it. The scene is casual and social, showcasing the bond and cam", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "bottle", "person", "tv", "chair", "mouse", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 163518, "caption": "A woman in a chef's uniform is preparing a large salad for a group of people. She is standing at a table with a variety of fresh vegetables, and she is using a plastic container to scoop up the ingredients. The woman is carefully arranging the salad ingredients", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "oven", "chair", "bowl"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 156696, "caption": "A train is parked on a platform, with a man standing next to it. The train has a large, colorful design on its side, and it appears to be a passenger train. The man is looking at the train, possibly admiring its design or waiting for it to depart. The image captures a", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "handbag", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 525202, "caption": "A group of friends is enjoying a delicious pizza at a restaurant, with a large pizza on a wooden table in front of them. They are taking bites and laughing together, enjoying their meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "spoon", "bottle", "dining table", "chair", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 423984, "caption": "A delicious plate of pasta, featuring a bowl of creamy white sauce, is being enjoyed by a person. The dish is accompanied by a slice of bread and a few carrots, making it a well-rounded and satisfying meal.", "mscoco_hallucinated_words": [["bowl", "bowl"], ["person", "person"]], "mscoco_gt_words": ["dining table", "carrot", "broccoli"], "hallucination_idxs": [8, 19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.3333333333333333}}, {"image_id": 499486, "caption": "A cat and a kitten are sitting on a bed, surrounded by a messy room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cat", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 118124, "caption": "A young man is sitting in a car, looking at his phone while wearing glasses and a tie. He is likely in a professional setting, possibly at work or attending a meeting. The image captures a moment of focus and concentration, as the man is engaged in a task on his phone.", "mscoco_hallucinated_words": [["phone", "cell phone"], ["phone", "cell phone"]], "mscoco_gt_words": ["person", "tie", "car"], "hallucination_idxs": [12, 56], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 1.0}}, {"image_id": 288729, "caption": "A cake in the shape of a circus tent is sitting on a table, surrounded by a blue and white striped tablecloth. The cake features a small elephant and a man in a red and white striped shirt, both of which are decorated with fondant. The cake", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "cake", "bear", "teddy bear", "elephant"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.6}}, {"image_id": 177721, "caption": "A young man is performing a skateboard trick on a ramp, jumping over a barrier and landing on a skateboard ramp.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 372220, "caption": "A man wearing a black hat and a white beard is walking down a street while holding a cell phone. He is surrounded by people, and he appears to be talking to someone on the phone.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "horse", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 252625, "caption": "A busy street in a city is filled with people, bicycles, and cars. There are several shops and restaurants along the street, and a red light is visible at the intersection. The scene is vibrant and lively, showcasing the hustle and bustle of urban life", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["person", "bicycle", "traffic light", "potted plant"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 493610, "caption": "A group of people are riding on a truck, which is parked on a dirt road. The truck is filled with passengers, and it appears to be a public transportation vehicle. The image captures the scene of people traveling together in a shared vehicle, which is a common mode of transport", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 302789, "caption": "A suitcase and a backpack are sitting on a bed in a small room, possibly a dorm room or a shared living space. The bed is covered with a blanket, and there is a small table nearby. The presence of the suitcase and backpack suggests that the room is occupied by someone who is", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bottle", "bed", "refrigerator", "handbag", "sink", "backpack", "suitcase"], "hallucination_idxs": [38], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.42857142857142855}}, {"image_id": 30667, "caption": "A brown dog is sitting on a bench with two people, possibly a man and a woman, in a park. The dog is laying down and appears to be comfortable, while the people are sitting next to it.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "dog", "boat"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.14285714285714285, "Recall": 0.6666666666666666}}, {"image_id": 114108, "caption": "A group of friends are enjoying a delicious meal together, with a pizza on the table. The pizza is topped with various ingredients, including cheese, tomato sauce, and herbs. The friends are engaged in conversation and laughing, making the moment a joyful and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "spoon", "chair", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 328110, "caption": "A young woman is sitting on a bench, holding her baby in a baby carrier. She is surrounded by people walking down the street, creating a lively atmosphere. The woman is enjoying the time spent with her baby, taking in the sights and sounds of the city while also engaging with the people", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["backpack", "bench", "handbag", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 366111, "caption": "A group of men riding bicycles down a city street, passing by a street sign, and a parked car.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "traffic light", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 532481, "caption": "A man is flying a kite on a beach, with a large wave in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["kite", "surfboard", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 291634, "caption": "A group of motorcycles is parked on the sidewalk in front of a building, creating a colorful and lively scene. The motorcycles are arranged in a row, with some of them being parked on the sidewalk and others on the street. The image captures the vibrant atmosphere", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 463678, "caption": "A man in white tennis attire is standing on a tennis court, holding a tennis racket and preparing to serve the ball. He is wearing a white shirt and white shorts, and his tennis shoes are visible. The image captures the moment before he makes contact with the ball, showc", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 70815, "caption": "A small dog sits on the sidewalk, looking up at a man on a bicycle as they pass by.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "dog", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 367872, "caption": "A baseball player is swinging a bat at a baseball, with a crowd of people watching in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "umbrella", "baseball bat", "baseball glove", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 353898, "caption": "A man sits on a stone bench surrounded by a group of white pigeons, reading a book.", "mscoco_hallucinated_words": [["book", "book"]], "mscoco_gt_words": ["person", "bird", "bench", "cell phone", "backpack"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6}}, {"image_id": 88269, "caption": "A plate with a bowl of tomato soup and a slice of toast is sitting on a table.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["spoon", "sandwich", "bowl"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 463211, "caption": "A young girl and her friend are walking down a street, with the girl wearing a backpack and the friend holding a backpack. They are both smiling and looking at each other, possibly enjoying each other's company or discussing something. The image captures a moment of friendship and companionship between", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 396269, "caption": "A beautiful floral arrangement sits on a gold-colored chair in a grand room, surrounded by intricate wallpaper and ornate furniture.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "vase", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 98979, "caption": "A black microwave oven is sitting on a countertop in a kitchen, with a window visible behind it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["microwave", "knife", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 244455, "caption": "Two police officers on motorcycles are riding down a street, with one officer waving at the camera. The officers are dressed in black and wearing helmets, and they are riding in a formation. The image captures the moment when they are passing by a group of people, possibly spectators", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 379443, "caption": "A pair of scissors is cutting a black mesh fabric, with a pair of orange scissors nearby.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "scissors", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 536154, "caption": "A young girl is sitting on a bed surrounded by a large collection of stuffed animals, including teddy bears, dolls, and other soft toys. She is smiling and enjoying the company of her stuffed friends.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["person", "cat", "teddy bear"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 374061, "caption": "A black cat is laying on a couch, holding a stuffed animal in its paws. The cat is sleeping and appears to be enjoying the softness of the couch and the comfort of the stuffed animal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["couch", "bear", "cat", "teddy bear", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 560018, "caption": "A group of people are enjoying a day at the beach, riding waves on surfboards and kayaks. The image captures the excitement and fun of water sports, with the surfers and kayakers riding the waves and enjoying the sunny day at the beach.", "mscoco_hallucinated_words": [["kayak", "boat"]], "mscoco_gt_words": ["kite", "surfboard", "person"], "hallucination_idxs": [17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 353320, "caption": "A guitar case and a suitcase are sitting on a bench at a train station, with a suitcase on top of the guitar case.", "mscoco_hallucinated_words": [["train", "train"]], "mscoco_gt_words": ["person", "bench", "handbag", "suitcase"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 256628, "caption": "A golden retriever dog is lying on a wooden deck, enjoying the sun and fresh air.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dog", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 158806, "caption": "A dog is sitting on a blue plate, eating a sandwich.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "sandwich"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 424270, "caption": "A young girl is sitting on a bed, surrounded by a pile of blankets and pillows. She is wearing a white dress and appears to be enjoying her cozy and comfortable environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 368335, "caption": "A horse is standing in a parking lot, looking at a car.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["horse", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 483227, "caption": "A group of young children, including a boy and a girl, are gathered around a tennis court, participating in a tennis lesson. They are standing in front of a net, holding tennis rackets and balls, and are engaged in a fun and interactive learning experience.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 228306, "caption": "A red double-decker bus is parked on the side of a street, with its front end visible.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 416384, "caption": "A woman is sitting on a wooden bench, using her phone while wearing a pink swimsuit.", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "cell phone", "chair"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 364783, "caption": "A red bathroom with a toilet, sink, and shower is shown in the image. The bathroom has a red and white color scheme, with red tiles on the floor and walls, and white fixtures such as the toilet, sink, and shower. The bathroom also", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bottle", "potted plant", "chair", "toilet", "toothbrush", "sink", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 335041, "caption": "A man and a woman are walking down a snow-covered street, each carrying a ski pole. They are walking in the middle of a snow-covered city street, surrounded by buildings and cars. The scene shows the winter season in the city, with snow covering the ground and the streets.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 531327, "caption": "A bowl of colorful vegetables, including broccoli, carrots, and green beans, is placed on a white plate. The vegetables are arranged in a pattern, with the broccoli in the center and the carrots and green beans surrounding it. A fork is placed next", "mscoco_hallucinated_words": [["bowl", "bowl"]], "mscoco_gt_words": ["spoon", "dining table", "wine glass", "knife", "broccoli", "fork", "carrot"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.16666666666666666, "Recall": 0.42857142857142855}}, {"image_id": 451228, "caption": "A group of people riding bicycles and walking on a busy street in London, England, is captured in this image. The street is filled with red double-decker buses and other vehicles, and the people are either riding bicycles or walking on the sidewalk. The scene shows the h", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "traffic light", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 256365, "caption": "A plate of blue cupcakes with white frosting and a swirl design sits on a white plate, surrounded by a few other cupcakes. The cupcakes are decorated with colorful sprinkles and a blue and white striped pattern.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cake", "dining table", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 502936, "caption": "A man is playing tennis on a court, with a tennis racket in hand and a tennis ball in the air. He is wearing a white shirt and shorts, and is standing in front of a green fence.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 451449, "caption": "A small dog is lying in a bed of books, surrounded by various books and other items. The dog is likely a pet, and its presence in the bookshelf suggests that it is a comfortable and cozy spot for it to rest.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dog", "book", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 51054, "caption": "An elderly woman is sitting on a bed, holding a cell phone and looking at it intently. She is likely using the phone to make a call or check her messages. The image captures a moment of her daily life, showcasing her reliance on technology to stay connected with her loved ones or complete", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "cell phone", "bed", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 1268, "caption": "A woman is sitting on a bench, taking a picture of a swan on the riverbank, while a man is standing nearby. The scene is set against a beautiful backdrop of a city skyline, with a bridge and a building visible in the distance. The woman is capturing the moment with her camera", "mscoco_hallucinated_words": [["bench", "bench"]], "mscoco_gt_words": ["person", "bird", "cell phone", "handbag", "backpack", "boat"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3333333333333333}}, {"image_id": 62692, "caption": "A young woman is playing tennis on a court, with a net in the background. She is wearing a black and white tennis outfit and is holding a tennis racket. She is standing in front of a net, ready to hit the ball.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 542771, "caption": "A woman is sitting at a desk in a room with a window, surrounded by various objects such as a chair, a table, and a vase.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "potted plant", "chair", "book", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 575406, "caption": "A red and blue bus is parked on a street in front of a building, with a yellow and blue bus in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bus", "person", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 244834, "caption": "A couple is walking down a sidewalk, holding an umbrella to protect them from the rain. They are walking together, enjoying each other's company, and smiling as they stroll through the city.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "bicycle", "potted plant", "umbrella", "car", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 151159, "caption": "A group of friends are playing a game of skateboarding on a basketball court, with one person riding a skateboard and another person holding a skateboard. They are having fun and enjoying the outdoor activity together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277073, "caption": "A man riding a scooter is driving down a busy street in the city, surrounded by cars and other vehicles.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle", "car", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 377879, "caption": "A large military tank is being transported on a trailer, which is being pulled by a truck. The tank is surrounded by a fence, and there is a sign on the trailer that reads \"Tank Transporter.\" The image captures the moment when the tank is being loaded onto the trailer", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "truck", "bed"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 436814, "caption": "A young woman is sitting at a desk in a room with a door, surrounded by various objects such as a computer, a chair, and a book. She is using a laptop and appears to be working on a project or studying. The room is well-lit and organized, with a window visible in the background", "mscoco_hallucinated_words": [["woman", "person"], ["book", "book"]], "mscoco_gt_words": ["laptop", "mouse", "dining table", "chair"], "hallucination_idxs": [2, 29], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.75}}, {"image_id": 63934, "caption": "A nun rides a skateboard down a sidewalk in front of a city building, wearing a habit and carrying a backpack.", "mscoco_hallucinated_words": [["backpack", "backpack"]], "mscoco_gt_words": ["person", "truck", "skateboard", "car"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 275611, "caption": "A delicious pizza is being served on a metal tray, with a slice of cheese and pepperoni on top. The pizza is placed on a table, and there are utensils nearby for guests to use. The image captures the moment when the pizza is being served, and it", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "knife", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 516248, "caption": "A young woman is sitting at a computer desk, using a computer mouse to navigate through a computer program. She is wearing a black jacket and has a laptop on her lap. The image captures the moment when she is about to click on a button or icon on the computer screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "tv", "person", "keyboard", "mouse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 478380, "caption": "A man is driving a bus down a road, surrounded by a large group of sheep.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "sheep"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 422326, "caption": "A group of motorcycles and a sidecar are parked in a parking lot, creating a colorful and lively scene. The motorcycles are arranged in a row, with one of them having a sidecar attached. The sidecar is designed to accommodate a passenger, adding a unique and fun", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "motorcycle", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 110449, "caption": "Two men are standing behind a counter, one of them is DJing while the other man is holding a microphone. They are both wearing casual clothing and are engaged in their respective tasks.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "tv", "person", "remote"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 45550, "caption": "A man is holding a plate of fried chicken and a cup of sauce, posing for a photo in a restaurant.", "mscoco_hallucinated_words": [["cup", "cup"]], "mscoco_gt_words": ["bowl", "clock", "sandwich", "person"], "hallucination_idxs": [11], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 444913, "caption": "A man is standing in a grassy area, holding a golf club and looking at the camera. He is wearing a baseball cap and a jacket, and appears to be enjoying the outdoors.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "frisbee", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 82709, "caption": "A dog is flying through the air while playing fetch with a frisbee on a grassy field.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "bottle", "frisbee", "dog", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 132796, "caption": "A group of people, including a man and a woman, are riding on the back of an elephant through the jungle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "chair", "elephant", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 303099, "caption": "Two cats, a black and white cat and a grey cat, sit on top of a toilet seat and a bathroom sink, respectively. They appear to be enjoying their time in the bathroom, possibly playing or resting. The image captures a lighthearted and playful moment between the", "mscoco_hallucinated_words": [["sink", "sink"]], "mscoco_gt_words": ["toilet", "bottle", "cat"], "hallucination_idxs": [23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6666666666666666}}, {"image_id": 271565, "caption": "A group of motorcyclists rides down a street, with a few cars parked along the side of the road. The motorcyclists are wearing helmets and riding in a line, while the cars are parked in a row. The scene suggests a group of motorcyclists", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 205193, "caption": "A cup of tea and a bag of tea leaves are sitting on a counter next to a microwave oven. The cup of tea is filled with hot water, and the bag of tea leaves is placed on top of the cup. The scene suggests that someone is preparing to make a cup of tea using the", "mscoco_hallucinated_words": [["cup", "cup"], ["cup", "cup"], ["cup", "cup"], ["cup", "cup"]], "mscoco_gt_words": ["person", "microwave", "toaster", "oven"], "hallucination_idxs": [1, 22, 43, 55], "metrics": {"CHAIRs": 1, "CHAIRi": 0.6666666666666666, "Recall": 0.5}}, {"image_id": 272566, "caption": "A man sits on a bench surrounded by various fruits, including bananas, apples, and oranges, at a market.", "mscoco_hallucinated_words": [["bench", "bench"], ["orange", "orange"]], "mscoco_gt_words": ["apple", "banana", "cup", "person"], "hallucination_idxs": [5, 17], "metrics": {"CHAIRs": 1, "CHAIRi": 0.4, "Recall": 0.75}}, {"image_id": 170099, "caption": "A man in a suit stands in front of a large image of a couch and a fireplace, both of which are covered in orange cushions. He is holding a microphone and appears to be giving a speech or presentation.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tie", "couch", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 14940, "caption": "A cat is laying on a bed, holding a stuffed animal, and looking at the camera.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["chair", "couch", "cat", "dog", "orange"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 408449, "caption": "A young man is skateboarding down a city street, wearing a black shirt and jeans, while a man in a suit is walking past him. The skateboarder is performing a trick, and the man in the suit is looking at him with a curious expression. The scene captures the", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "car", "handbag", "truck", "skateboard", "bus", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 140702, "caption": "A young elephant is walking alongside its mother in a grassy field, with the mother holding a baby elephant in her trunk. The baby elephant is suckling on its mother's trunk, while the mother looks on. This image captures the close bond between the mother and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["elephant", "bird", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 354540, "caption": "A man is sitting on a kitchen counter, surrounded by various cables and wires. He is holding a cord and appears to be working on an electrical project.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "person", "oven", "chair", "cell phone", "microwave", "toaster"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 19763, "caption": "A large pizza sits on a white plate, surrounded by two glasses of beer. The pizza is cut into slices, and it appears to be a popular choice for a meal or snack. The presence of the beer suggests that the pizza might be enjoyed with a drink, adding", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.14285714285714285}}, {"image_id": 191301, "caption": "A delicious chocolate cake sits on a white plate, accompanied by a spoon and a fork. The cake is topped with whipped cream and a cherry, making it a visually appealing dessert.", "mscoco_hallucinated_words": [["fork", "fork"]], "mscoco_gt_words": ["person", "dining table", "spoon", "cake", "cup"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.4}}, {"image_id": 124236, "caption": "A kitchen table is filled with various cooking utensils and dishes, including a pot, a pan, and a bowl. The table is also surrounded by a green chair and a stove. The scene appears to be a kitchen setting, where someone is preparing food or cleaning up after a me", "mscoco_hallucinated_words": [["chair", "chair"]], "mscoco_gt_words": ["spoon", "dining table", "oven", "bowl", "toaster"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.6}}, {"image_id": 344930, "caption": "A red fire hydrant stands on a grassy street, surrounded by cars and a parked vehicle.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["fire hydrant", "orange", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 14285, "caption": "A cat is sitting on a bed, surrounded by various items such as a TV, a computer, and a clock. The cat is looking at the camera, possibly curious about the presence of the camera or the people in the room. The image captures the cat's natural curiosity and the cluttered room,", "mscoco_hallucinated_words": [["computer", "laptop"], ["clock", "clock"], ["person", "person"]], "mscoco_gt_words": ["tv", "chair", "cat", "book", "bed", "remote"], "hallucination_idxs": [18, 22, 42], "metrics": {"CHAIRs": 1, "CHAIRi": 0.375, "Recall": 0.5}}, {"image_id": 82488, "caption": "A pair of beds or a bed and a couch are seen in a room, with a lamp and a clock on the nightstand. The room is decorated with a yellow and orange color scheme, adding a warm and inviting atmosphere.", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["clock", "dining table", "orange", "book", "bed", "remote"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.5}}, {"image_id": 348251, "caption": "A man is skiing down a snowy slope, wearing a green jacket, black pants, and a backpack. He is holding a ski pole and appears to be enjoying the winter sport.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 150703, "caption": "A man is holding a hot dog and a beer, sitting at a table with a cup of beer in front of him.", "mscoco_hallucinated_words": [["man", "person"]], "mscoco_gt_words": ["dining table", "hot dog", "sandwich", "cup"], "hallucination_idxs": [1], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 381615, "caption": "A window-sill garden filled with various plants and flowers is visible in the image. The plants are arranged in a decorative manner, and there is a chair nearby. The plants add a touch of greenery and beauty to the room, making it a cozy and inviting space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["potted plant", "chair", "book", "vase", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 352703, "caption": "A woman is cooking a dish on a stove, using a spatula to stir the ingredients. She is wearing a black apron and a white hat, and there is a large pot on the stove. The scene is taking place at an outdoor event, with people gathered around", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "dining table", "person", "bottle", "oven", "bowl", "handbag", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 111109, "caption": "A young boy is sitting on a chair, wearing shorts and a white shirt, and smiling at the camera.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "chair", "motorcycle", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 226802, "caption": "A busy street scene with a mix of cars, buses, and pedestrians is captured in the image. The street is lined with buildings, and there are several vehicles parked along the sidewalk. The scene is quite crowded, with people walking and cars driving through the area.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bus", "motorcycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 49005, "caption": "A baseball game is taking place on a grass field, with several players participating in the game. The players are wearing baseball uniforms and are positioned on the field, ready to play. The image captures the excitement and energy of the game, as the players prepare to hit the ball and run around the", "mscoco_hallucinated_words": [["ball", "sports ball"]], "mscoco_gt_words": ["person", "baseball bat", "baseball glove"], "hallucination_idxs": [54], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.3333333333333333}}, {"image_id": 410114, "caption": "A group of cows is walking down a dirt road, with a car driving past them in the background.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["person", "horse", "cow", "truck"], "hallucination_idxs": [13], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.25}}, {"image_id": 100274, "caption": "A train is parked on a railroad track, surrounded by a large, empty parking lot. The train is covered in graffiti, and there are several cars parked nearby. The scene is set against a blue sky, giving the impression of a peaceful and serene environment.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["train", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 317254, "caption": "A man rides a black motorcycle down a city street, passing by a red car. The man is wearing a helmet and riding in a casual, relaxed manner, enjoying the ride.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 425569, "caption": "A large kitchen with various utensils and cooking equipment is shown in the image. The kitchen is filled with pots, pans, and other cooking tools, as well as a large stove and oven. There are also several silverware sets and dishes on the countertops. The kitchen", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "sink", "oven"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 28842, "caption": "A man is riding a skateboard down a grassy hill, enjoying the outdoor activity and the sunny day.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 319607, "caption": "A man rides a bicycle on a city street, passing by a building with a red traffic light. The street is lined with cars and has a bike lane, indicating that it is a busy and active area.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "backpack", "car", "bus", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 210372, "caption": "A red kitchen with a white sink and a stove is shown in the image. The kitchen has a dishwasher, a refrigerator, and a microwave. There is also a window in the kitchen, and the room is well-lit. The kitchen appears to be clean and organized", "mscoco_hallucinated_words": [["stove", "oven"], ["microwave", "microwave"]], "mscoco_gt_words": ["bottle", "sink", "refrigerator"], "hallucination_idxs": [9, 27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.6666666666666666}}, {"image_id": 156915, "caption": "A bouquet of red roses sits in a vase on a wooden table, surrounded by white flowers. The arrangement of flowers is beautiful and eye-catching, adding a touch of elegance to the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "vase", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 349642, "caption": "A man is sitting on a bench, with his dog sitting next to him. The man is wearing a jacket, and the dog is a small brown dog. They are both sitting on the bench, enjoying the outdoors together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 423008, "caption": "A bustling market scene is captured in the image, with numerous boats and people gathered around the waterfront. The boats are filled with various goods, and people are shopping and socializing. The atmosphere is lively and vibrant, showcasing the local culture and commerce of the area.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "boat", "umbrella", "handbag", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 45435, "caption": "A person is holding a smartphone in their hand, with the screen displaying a white and black image.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cell phone", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 35827, "caption": "A man is sitting at a desk in a room, surrounded by various electronic devices and papers. He is working on a computer, possibly on a project or writing an email. The room is well-lit, and there is a window in the background, providing natural light. The man is wearing a casual", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "bottle", "person", "tv", "chair", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.42857142857142855}}, {"image_id": 72656, "caption": "Three young boys are sitting at a small wooden table, enjoying a meal together. They are eating pizza and drinking soda, and one of the boys is holding a toy. The scene shows the boys' camaraderie and enjoyment of their shared meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "bowl", "pizza", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 372087, "caption": "A green train is parked on a platform, with a yellow train in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "bench", "suitcase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 336209, "caption": "A young man is riding a skateboard on a concrete floor, performing a trick in front of a large building.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "skateboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 46031, "caption": "A laptop computer is sitting on a desk, surrounded by various electronic devices, such as a mouse, a keyboard, and a computer mousepad. The desk is also covered with a green plant, adding a touch of natural beauty to the space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "tv", "cell phone", "keyboard", "mouse"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 283118, "caption": "A family of three, including a mother and two children, is sitting at a table in a restaurant, enjoying their meal together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "chair", "cell phone", "car", "handbag", "backpack", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2222222222222222}}, {"image_id": 429598, "caption": "A kitchen with a brick wall, wooden cabinets, and a stainless steel refrigerator is shown in the image. The kitchen also features a wooden table and a stove, as well as a sink and a dishwasher. The overall design of the kitchen is rustic and traditional,", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["bottle", "sink", "oven", "refrigerator"], "hallucination_idxs": [27], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.75}}, {"image_id": 333365, "caption": "A large airplane is parked at an airport, surrounded by other airplanes and a baggage carousel.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "airplane", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 424174, "caption": "A colorful fruit bowl filled with various fruits, including bananas, apples, and oranges, sits on a wooden table. The bowl is surrounded by a variety of other fruits, such as pineapples, grapes, and lemons. The image showcases a diverse", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "dining table", "bowl", "banana", "orange"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 3035, "caption": "A large airplane is parked on a runway, surrounded by various airport amenities such as a baggage claim and a ticket counter. The airplane is positioned next to a large, open area, which could be a tarmac or a parking lot. The image captures the busy", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "airplane", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 177213, "caption": "A man is sitting at a table, holding a pizza in his hand, and smiling. The pizza is on a white plate, and it appears to be a delicious and freshly made dish. The man is enjoying his meal, and the image captures a moment of satisfaction and enjoy", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "knife", "fork", "cup", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 438535, "caption": "A large clock is mounted on a pole in the middle of a city street, surrounded by tall buildings and a busy cityscape. The clock is a prominent feature in the urban landscape, and its presence serves as a reminder of the importance of time and the need to stay on schedule.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "backpack", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 490711, "caption": "A white refrigerator is sitting in a kitchen, surrounded by cabinets and countertops. The refrigerator has a stainless steel door and is filled with various items, including a bottle of water, a coffee mug, and a bag of groceries. The kitchen is clean", "mscoco_hallucinated_words": [["bottle", "bottle"]], "mscoco_gt_words": ["banana", "sink", "refrigerator"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 163728, "caption": "A cute cat is lying on a table, with a mouse on its head. The cat is sleeping, and the mouse is on its nose, which is likely a playful and cute pose.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "dining table", "cat", "mouse", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 456756, "caption": "A giraffe stands in a zoo enclosure, looking at the camera with its long neck and legs.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "giraffe", "zebra"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 281028, "caption": "A passenger train car with two seats in the front, one of which is occupied by a man, and a window view of a city street.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "train", "chair", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 343937, "caption": "A young woman is skiing down a snowy slope, wearing a white jacket and a helmet. She is standing on a snowboard, balancing herself on the edge of the board as she rides down the mountain.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "snowboard"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 277051, "caption": "Two small birds perched on a table, pecking at a piece of bread.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bird", "dining table", "bottle", "chair", "knife"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 145666, "caption": "A bowl filled with chopped broccoli is sitting on a stove, ready to be cooked. The broccoli is chopped into small pieces, and it appears to be in the process of being steamed or boiled. The image shows a close-up view of the chopped brocc", "mscoco_hallucinated_words": [["stove", "oven"]], "mscoco_gt_words": ["bowl", "carrot", "dining table", "broccoli"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 304984, "caption": "A delicious sandwich, a glass of orange juice, and a bowl of chicken salad are all laid out on a white plate, making for a satisfying and healthy meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["wine glass", "bowl", "cake", "orange", "sandwich", "fork"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 122467, "caption": "A man is holding a Nintendo Game Boy, with his hand wrapped around the controller and the console.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "remote", "dining table", "couch"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 518287, "caption": "A white toothbrush with a smiling face is sitting in a tube of toothpaste, ready to be used for brushing teeth.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["dining table", "orange", "cup", "toothbrush"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 145448, "caption": "A black cat is sitting on top of a motorcycle, with its paws resting on the handlebars.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "chair", "motorcycle", "cat", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 352900, "caption": "A delicious plate of pasta is being served on a white plate, with a fork and knife placed next to it. The pasta is covered in a creamy sauce, and it appears to be a popular dish.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "knife", "fork", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 153607, "caption": "A blue glass vase with a flower in it sits on a table, surrounded by other objects. The vase is decorated with a blue and white striped pattern, adding a touch of color and elegance to the scene. The flower, which is a bright orange daisy, adds a pop of v", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "orange", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 157581, "caption": "A collection of wine bottles and glasses sits on a table, arranged in a neat and organized manner. The wine bottles are labeled with different names, such as Chardonnay, Merlot, and Cabernet Sauvignon, while the glasses are filled with wine. This image show", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "chair", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 227438, "caption": "A luxurious bedroom with a large bed and a desk is shown in the image. The bedroom has a warm and inviting atmosphere, with a lamp and a window providing natural light. The room is decorated with a few pieces of furniture, such as a chair and a table, and there", "mscoco_hallucinated_words": [["desk", "dining table"], ["table", "dining table"]], "mscoco_gt_words": ["couch", "clock", "chair", "bed"], "hallucination_idxs": [9, 52], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.5}}, {"image_id": 116037, "caption": "A young girl is playing baseball at a field, swinging a bat and running towards home plate. She is wearing a black and yellow uniform, and there are other players in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "baseball bat", "sports ball", "baseball glove"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 202658, "caption": "A pink toilet sits next to a white toilet, both of which are in a bathroom setting. The pink toilet has a Hello Kitty design on it, adding a playful touch to the bathroom.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "toilet", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 18150, "caption": "A young boy is sitting on a bed, eating a pizza while a man, possibly his father, is sitting next to him. The man is holding a pizza box and handing it to the boy. The scene is likely a family moment, where the father is sharing a meal with his son.", "mscoco_hallucinated_words": [["bed", "bed"]], "mscoco_gt_words": ["person", "bottle", "couch", "backpack", "pizza"], "hallucination_idxs": [7], "metrics": {"CHAIRs": 1, "CHAIRi": 0.1111111111111111, "Recall": 0.4}}, {"image_id": 418711, "caption": "A man rides a bicycle down a dirt road, carrying a large basket filled with bananas. The man is wearing a white shirt and a hat, and he is surrounded by a group of people who are watching him. The scene is set in a rural area, with a few trees and", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bicycle", "banana", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6}}, {"image_id": 92107, "caption": "A bowl of creamy corn soup sits on a green tablecloth, surrounded by a spoon and a piece of bread. The soup is made with corn, broccoli, and other vegetables, and it is served in a green bowl.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "dining table", "bowl", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 491000, "caption": "A group of people walk down a cobblestone street in a historic city, passing by a row of colorful buildings.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "motorcycle", "dog", "car", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 401163, "caption": "A man sits on a bench in a park, surrounded by trees and a small dog.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dog", "bench"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 39663, "caption": "A backpack, a laptop, a notebook, a pencil case, a pink pen, a black pen, a pair of scissors, a small bag, and a book are all laid out on a floor. The items are neatly arranged, and the backpack is open, revealing", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "cell phone", "scissors", "book", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.8}}, {"image_id": 268293, "caption": "A man in a blue shirt and white shorts is playing tennis, using a tennis racket to hit a tennis ball. He is standing on a grassy field, and the sun is shining down on him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 474499, "caption": "A kitchen with a stove, oven, and refrigerator is filled with various cooking utensils, pots, and pans. There are also several bottles of condiments and spices on the countertop. The kitchen is clean and organized, with a dishwasher in", "mscoco_hallucinated_words": [["refrigerator", "refrigerator"]], "mscoco_gt_words": ["spoon", "apple", "bottle", "clock", "oven", "vase", "sink"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.2857142857142857}}, {"image_id": 358086, "caption": "A group of young women are playing soccer in a field, with one woman in the air, possibly attempting to score a goal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bottle", "frisbee", "chair", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2}}, {"image_id": 89541, "caption": "A yellow lunch box filled with various food items, including a sandwich, a cookie, and a slice of cake, sits on a table.", "mscoco_hallucinated_words": [["sandwich", "sandwich"]], "mscoco_gt_words": ["bowl", "dining table", "banana", "cake"], "hallucination_idxs": [12], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.5}}, {"image_id": 239445, "caption": "A young man is holding a frisbee and smiling while standing in a park.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "frisbee"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 105782, "caption": "A young kangaroo is standing in a grassy field, looking up at a tree.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["kite", "cat", "dog", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.0}}, {"image_id": 487990, "caption": "A group of friends is gathered around a table, enjoying a meal together. One person is holding a guitar and playing it while others are eating and socializing. The scene is filled with various food items, including pizza, cupcakes, and a cake. The atmosphere is lively and fun", "mscoco_hallucinated_words": [["pizza", "pizza"]], "mscoco_gt_words": ["spoon", "person", "bottle", "dining table", "donut", "bowl", "cake", "knife", "fork", "cup"], "hallucination_idxs": [41], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 0.3}}, {"image_id": 138834, "caption": "A man is walking down a snowy road, carrying a pair of skis on his back. He is wearing a black jacket and a ski helmet, and appears to be enjoying the winter weather.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "skis", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 492057, "caption": "A man in a green jacket and a tie is standing in front of a mirror, taking a selfie with his phone. He is smiling and appears to be happy with the image he is capturing.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["cell phone", "tie", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 388215, "caption": "A young man is playing tennis on a court, holding a tennis racket and preparing to hit the ball. He is wearing a white shirt and white shorts, and is standing in front of a net.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "sports ball", "tennis racket"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 111409, "caption": "A man rides a motorcycle down a ramp, with his helmet on and his hands on the handlebars. He is wearing a white shirt and jeans, and the motorcycle has a red and white color scheme. The man is enjoying the thrill of riding the motorcycle down", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["motorcycle", "bicycle", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 451391, "caption": "A man is holding a bunch of fresh, green broccoli in a market, showcasing the vegetable's vibrant colors and freshness.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "broccoli"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 92462, "caption": "A group of cows is walking down a street in a small town, likely in a rural or agricultural area. The cows are walking in a line, with one cow leading the way. The scene is likely a common sight in such towns, where cows are often used for farming and transportation.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "cow", "backpack", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 397268, "caption": "A bicycle shop is showcased in the image, with a variety of bicycles and accessories displayed on the sidewalk outside. The shop is located in a small town, and the bicycles are arranged in a neat and organized manner. The image captures the essence of a bicy", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "chair", "bench", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 127659, "caption": "A man is sitting on a bench next to a train station, looking at his phone. The train station is empty, and there are no other people around. The man is likely waiting for a train or checking his schedule.", "mscoco_hallucinated_words": [["phone", "cell phone"]], "mscoco_gt_words": ["person", "dog", "train", "bench"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.75}}, {"image_id": 251857, "caption": "A young man is skateboarding on a sidewalk, while a group of people watches him.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "skateboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 243212, "caption": "A young boy is holding a frisbee in a grassy field, looking at the camera with a smile on his face.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "frisbee", "dog", "car", "truck"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 444304, "caption": "A man is sitting on a couch, watching a television with a remote control in his hand. The television is showing a person on a screen, possibly a character from a video game or a movie. The man is likely engrossed in the content being displayed on the screen, and the television is a common household", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["person", "tv", "remote", "bed"], "hallucination_idxs": [6], "metrics": {"CHAIRs": 1, "CHAIRi": 0.125, "Recall": 0.75}}, {"image_id": 305000, "caption": "A woman is standing at a fruit stand, surrounded by various fruits and vegetables. She is wearing a black shirt and a hat, and she is looking at the produce on display. The fruit stand is located in a small, rural town, and the woman appears to be a local vendor.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["apple", "banana", "person"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.3333333333333333}}, {"image_id": 44136, "caption": "Two men, dressed in black tuxedos, are sitting at a table in a banquet hall, enjoying a beer together.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "bottle", "wine glass", "tie"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 154846, "caption": "A group of people are enjoying a delicious pizza on a large metal tray, with various toppings and slices of pizza on the tray.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "dining table", "pizza"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 567254, "caption": "A young boy is sitting in front of a television, holding a pink toy and looking at the screen.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tv", "bottle", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 79261, "caption": "A man is standing in the middle of a fountain, holding a broom and wearing a white shirt. He is surrounded by water, and there is a sign nearby that reads \"No Swimming.\"", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "clock", "handbag", "backpack"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 301402, "caption": "A young man is sitting in a chair, using a laptop computer while wearing a hat and a scarf. He is surrounded by people, possibly friends or family members, who are gathered around him. The scene appears to be a casual and social setting, where the young man is engaging in an activity on", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["laptop", "person", "bottle", "dining table", "potted plant", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 415828, "caption": "A group of people is gathered in front of a building in a city, possibly enjoying a sunny day. They are standing in a parking lot, and there is a car parked nearby. The scene appears to be a social gathering or a casual event, with people chatting and laughing together", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "backpack", "umbrella", "car", "handbag", "stop sign", "traffic light"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 543231, "caption": "A young woman is holding a small white plastic tube, looking at it intently while sitting on a couch. She is surrounded by people, possibly friends or family members, who are watching her. The image captures a moment of curiosity and engagement as the woman examines the tube, possibly using", "mscoco_hallucinated_words": [["couch", "couch"]], "mscoco_gt_words": ["person", "bowl", "book", "bed", "remote"], "hallucination_idxs": [19], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.2}}, {"image_id": 495357, "caption": "A man rides a motorcycle down a city street, surrounded by people and cars.", "mscoco_hallucinated_words": [["car", "car"]], "mscoco_gt_words": ["motorcycle", "dog", "handbag", "person"], "hallucination_idxs": [14], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.5}}, {"image_id": 523175, "caption": "A bowl of hearty soup filled with vegetables, meat, and potatoes sits on a table, ready to be enjoyed by the person holding a spoon. The soup is made with a variety of ingredients, including carrots, celery, and onions, and is served in a", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["spoon", "carrot", "dining table", "bowl"], "hallucination_idxs": [24], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 184945, "caption": "A group of motorcycles is parked along a sidewalk, creating a colorful and lively scene. The bikes are arranged in a row, with some of them leaning against the wall. The image captures the vibrant atmosphere of the city, where people can enjoy riding and parking", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["motorcycle", "bicycle", "potted plant"], "hallucination_idxs": [45], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.6666666666666666}}, {"image_id": 49942, "caption": "A young man is standing under an umbrella, looking down at the ground. He is wearing a suit and tie, and his hair is messy. The image captures a moment of contemplation or introspection, as the man is lost in thought while holding the umbrella.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "tie", "umbrella"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 1.0}}, {"image_id": 223019, "caption": "A man is standing in front of a train, looking at the camera. The train is a blue and white train with a large orange sign on the side. The man is wearing a suit and tie, and he appears to be waiting for the train to depart. The image captures the moment of the man'", "mscoco_hallucinated_words": [["orange", "orange"], ["tie", "tie"]], "mscoco_gt_words": ["person", "car", "handbag", "train", "backpack", "suitcase"], "hallucination_idxs": [26, 39], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2222222222222222, "Recall": 0.3333333333333333}}, {"image_id": 42889, "caption": "A teddy bear sits on a red table, wearing glasses and holding a microphone. The teddy bear is surrounded by various electronic devices, including a computer, a cell phone, and a headset. The image captures a playful and funny scene, showcasing the teddy bear", "mscoco_hallucinated_words": [["table", "dining table"], ["computer", "laptop"], ["cell phone", "cell phone"]], "mscoco_gt_words": ["keyboard", "bear", "teddy bear"], "hallucination_idxs": [7, 28, 31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 22112, "caption": "A small bowl filled with fresh herbs sits on a wooden table next to a vase containing flowers. The herbs and flowers create a visually appealing and fragrant display, adding a touch of natural beauty to the room.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bowl", "dining table", "vase", "potted plant"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}, {"image_id": 247587, "caption": "A man is standing on a surfboard, riding the waves on the beach.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "surfboard", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 171962, "caption": "A green city bus is parked at a bus stop, with a bike rack attached to the side of the vehicle. The bus stop is located on a street with a bridge in the background.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["bicycle", "bus", "person", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 545056, "caption": "A group of cows grazes in a green field, surrounded by a fence.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["car", "dog", "cow", "sheep"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.25}}, {"image_id": 401411, "caption": "A chef is preparing a meal in a kitchen, surrounded by various ingredients and utensils. He is using a knife to cut up vegetables and meat, and a spatula to flip the food on a grill. The chef is working in a well-organized kitchen,", "mscoco_hallucinated_words": [["knife", "knife"]], "mscoco_gt_words": ["person", "dining table", "oven", "bowl", "book", "carrot", "cup"], "hallucination_idxs": [21], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.14285714285714285}}, {"image_id": 2867, "caption": "A group of people, including a man and a woman, are standing on a snowy slope, possibly preparing to ski or snowboard. They are wearing various outdoor gear, such as ski jackets, hats, and backpacks, and are holding skis and snowboards. The scene", "mscoco_hallucinated_words": [["snowboard", "snowboard"], ["snowboard", "snowboard"]], "mscoco_gt_words": ["person", "skis", "backpack"], "hallucination_idxs": [24, 48], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2222222222222222, "Recall": 1.0}}, {"image_id": 246963, "caption": "A group of motorcyclists riding on a road, with one motorcycle in the foreground and several others in the background, creating a line of bikes.", "mscoco_hallucinated_words": [["bike", "bicycle"]], "mscoco_gt_words": ["motorcycle", "person", "stop sign"], "hallucination_idxs": [26], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 498225, "caption": "A group of people is gathered in front of a bakery window, admiring the delicious pastries and cakes on display. They are likely discussing their preferences and enjoying the variety of treats available.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "donut", "cake", "cell phone", "handbag"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 124601, "caption": "A kitchen with a countertop, sink, and stove is filled with various items, including a coffee maker, a laptop, and a dishwasher. The scene appears to be a busy and cluttered space, with the coffee maker and laptop on the countertop, and the dish", "mscoco_hallucinated_words": [["stove", "oven"]], "mscoco_gt_words": ["laptop", "dining table", "bottle", "wine glass", "keyboard", "microwave", "sink", "cup"], "hallucination_idxs": [9], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.25}}, {"image_id": 581749, "caption": "A large bag of fresh vegetables, including broccoli, carrots, and lettuce, is sitting on a table surrounded by other food items. The bag is filled with various vegetables, and the table is covered with a plastic sheet to protect the food from dust and other contaminants.", "mscoco_hallucinated_words": [["carrot", "carrot"]], "mscoco_gt_words": ["dining table", "orange", "broccoli"], "hallucination_idxs": [10], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 227960, "caption": "A bowl of Brussels sprouts is filled with a creamy sauce, and a spoon is used to scoop out the vegetables. The image shows a close-up of the bowl, highlighting the delicious and nutritious meal.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["spoon", "wine glass", "bowl", "carrot", "cup"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.4}}, {"image_id": 286503, "caption": "A large elephant is standing in a zoo enclosure, surrounded by a fence and a wooden structure. The elephant is looking at the camera, and there is a bird hanging from a tree branch in the background.", "mscoco_hallucinated_words": [["bird", "bird"]], "mscoco_gt_words": ["elephant", "sports ball", "person"], "hallucination_idxs": [31], "metrics": {"CHAIRs": 1, "CHAIRi": 0.3333333333333333, "Recall": 0.3333333333333333}}, {"image_id": 315740, "caption": "A modern kitchen with a wooden countertop and stainless steel appliances is filled with various kitchen utensils and a sink. The kitchen has a large window, allowing natural light to enter and illuminate the space.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "oven", "potted plant", "chair", "bowl", "couch", "microwave", "sink"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.125}}, {"image_id": 142108, "caption": "A group of people, including a man and a woman, are gathered around a table with a large, white sheet on it. They are engaged in a cooking activity, possibly making sandwiches or preparing food for a meal. The man is holding a knife, and the woman is holding a piece", "mscoco_hallucinated_words": [["sandwich", "sandwich"], ["knife", "knife"]], "mscoco_gt_words": ["person", "dining table", "banana"], "hallucination_idxs": [36, 49], "metrics": {"CHAIRs": 1, "CHAIRi": 0.25, "Recall": 0.6666666666666666}}, {"image_id": 542933, "caption": "A baseball player is standing on the field, ready to hit a baseball during a game. The player is wearing a baseball uniform and holding a bat, while the crowd is watching from the stands.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "bench", "chair", "baseball bat", "baseball glove", "sports ball"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.16666666666666666}}, {"image_id": 475043, "caption": "A group of friends are sitting around a table, enjoying their drinks and laughing together. They are using their laptops and smartphones to stay connected and share content. The scene captures the modern way of socializing, where technology plays a significant role in connecting people and enhancing their interactions", "mscoco_hallucinated_words": [["table", "dining table"], ["smartphone", "cell phone"]], "mscoco_gt_words": ["spoon", "person", "bottle", "laptop", "bowl", "couch"], "hallucination_idxs": [8, 23], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.3333333333333333}}, {"image_id": 456784, "caption": "A man is holding a knife and cutting a cake, possibly a birthday cake, in front of a table.", "mscoco_hallucinated_words": [["table", "dining table"]], "mscoco_gt_words": ["person", "cake", "knife"], "hallucination_idxs": [20], "metrics": {"CHAIRs": 1, "CHAIRi": 0.2, "Recall": 1.0}}, {"image_id": 33753, "caption": "A small television is sitting on a bench in a park, surrounded by greenery.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["tv", "remote", "bench", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.5}}, {"image_id": 448694, "caption": "A group of young men are playing a game of ultimate frisbee in a park, with one man throwing the frisbee and another man catching it.", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "frisbee", "chair"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.6666666666666666}}, {"image_id": 99053, "caption": "A bowl of noodles, possibly stir-fried vegetables, and meat is being eaten by a person.", "mscoco_hallucinated_words": [["person", "person"]], "mscoco_gt_words": ["dining table", "bowl", "broccoli", "fork", "carrot"], "hallucination_idxs": [16], "metrics": {"CHAIRs": 1, "CHAIRi": 0.5, "Recall": 0.2}}, {"image_id": 503210, "caption": "A living room with a couch, a piano, and a large window is shown in the image. The room is decorated with orange and yellow accents, and there are several pillows and cushions on the couch. The piano is placed in the corner of the room, and the large window allows", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["clock", "potted plant", "chair", "couch", "orange", "book", "vase"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.2857142857142857}}, {"image_id": 142257, "caption": "A busy street scene with multiple cars driving down the road, including a red car and a blue car. The cars are driving in both directions, and there are traffic lights at the intersection. The image captures the hustle and bustle of city life, with people going about their daily routines and comm", "mscoco_hallucinated_words": [], "mscoco_gt_words": ["person", "traffic light", "truck", "car"], "hallucination_idxs": [], "metrics": {"CHAIRs": 0, "CHAIRi": 0.0, "Recall": 0.75}}], "overall_metrics": {"CHAIRs": 0.27, "CHAIRi": 0.10577971646673937, "Recall": 0.4733485193621868, "num_hallucinated_caps": 135.0, "num_caps": 500.0, "hallucinated_word_count": 194.0, "coco_word_count": 1834.0, "length_response": 41.106, "hallucinated_caps_ls": [144305, 308003, 95908, 324008, 501311, 39053, 253630, 161227, 195645, 32625, 343534, 254368, 233888, 213905, 409346, 344942, 275929, 300124, 12669, 133146, 498747, 185327, 454161, 129707, 368367, 201555, 489909, 405183, 333712, 148977, 183571, 325836, 467887, 557998, 401010, 313928, 122602, 24104, 279407, 527497, 229659, 265628, 499594, 258209, 245664, 453731, 418692, 259345, 443299, 545594, 219546, 535403, 375769, 426172, 138078, 152499, 180764, 537861, 146504, 301837, 240681, 14773, 563938, 134768, 526414, 192656, 412407, 191691, 159979, 357, 134223, 198163, 217593, 475813, 53431, 441840, 381031, 9628, 330050, 254161, 423984, 118124, 288729, 252625, 302789, 30667, 353898, 88269, 536154, 560018, 353320, 416384, 531327, 1268, 436814, 63934, 45550, 303099, 205193, 272566, 14940, 191301, 124236, 14285, 82488, 150703, 49005, 410114, 210372, 429598, 490711, 145666, 227438, 18150, 474499, 89541, 487990, 127659, 444304, 543231, 495357, 523175, 184945, 223019, 42889, 401411, 2867, 246963, 124601, 581749, 286503, 142108, 475043, 456784, 99053]}}}