category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.615,0.275,0.67,0.68,0.66,0.67
attribute_recognition,200,0.405,0.185,0.58,0.605,0.61,0.635
dynamic_temporal,200,0.2,0.395,0.39,0.375,0.35,0.385
hallucination_detection,200,0.835,0.035,0.915,0.885,0.91,0.895
object_counting,200,0.075,0.405,0.345,0.275,0.295,0.35
object_localization,200,0.165,0.165,0.45,0.5,0.475,0.56
object_presence,200,0.39,0.225,0.6,0.615,0.575,0.615
scene_understanding,200,0.74,0.04,0.89,0.845,0.87,0.85
spatial_relationship,200,0.19,0.22,0.495,0.535,0.51,0.465
visual_grounding,200,0.01,0.69,0.095,0.115,0.095,0.145
Average,2000,0.362,0.264,0.543,0.543,0.535,0.557
