category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.635,0.305,0.665,0.655,0.67,0.66
attribute_recognition,200,0.385,0.13,0.59,0.68,0.685,0.62
dynamic_temporal,200,0.09,0.34,0.375,0.365,0.335,0.35
hallucination_detection,200,0.28,0.24,0.555,0.525,0.535,0.5
object_counting,200,0.18,0.435,0.365,0.395,0.345,0.34
object_localization,200,0.115,0.085,0.55,0.505,0.54,0.545
object_presence,200,0.32,0.235,0.555,0.57,0.52,0.535
scene_understanding,200,0.81,0.04,0.905,0.91,0.88,0.865
spatial_relationship,200,0.04,0.17,0.405,0.37,0.38,0.31
visual_grounding,200,0.37,0.105,0.665,0.68,0.655,0.655
Average,2000,0.323,0.208,0.563,0.566,0.554,0.538
