category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.455,0.28,0.575,0.595,0.61,0.59
attribute_recognition,200,0.63,0.09,0.75,0.775,0.805,0.805
dynamic_temporal,200,0.195,0.2,0.515,0.49,0.51,0.475
hallucination_detection,200,0.625,0.105,0.77,0.785,0.805,0.78
object_counting,200,0.23,0.36,0.42,0.45,0.45,0.415
object_localization,200,0.39,0.115,0.605,0.67,0.665,0.655
object_presence,200,0.415,0.22,0.595,0.585,0.595,0.6
scene_understanding,200,0.81,0.04,0.87,0.89,0.875,0.89
spatial_relationship,200,0.44,0.035,0.75,0.745,0.75,0.715
visual_grounding,200,0.005,0.715,0.08,0.125,0.115,0.09
Average,2000,0.42,0.216,0.593,0.611,0.618,0.602
