category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.305,0.075,0.635,0.63,0.61,0.655
attribute_recognition,200,0.555,0.095,0.79,0.745,0.72,0.74
dynamic_temporal,200,0.12,0.25,0.41,0.375,0.385,0.43
hallucination_detection,200,0.355,0.14,0.585,0.65,0.6,0.61
object_counting,200,0.06,0.26,0.35,0.395,0.355,0.37
object_localization,200,0.16,0.19,0.43,0.455,0.475,0.46
object_presence,200,0.375,0.195,0.62,0.59,0.565,0.63
scene_understanding,200,0.735,0.035,0.875,0.85,0.85,0.875
spatial_relationship,200,0.245,0.045,0.63,0.635,0.61,0.61
visual_grounding,200,0.0,0.66,0.13,0.12,0.07,0.12
Average,2000,0.291,0.195,0.546,0.544,0.524,0.55
