category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.495,0.245,0.59,0.595,0.65,0.625
attribute_recognition,200,0.515,0.12,0.705,0.71,0.705,0.715
dynamic_temporal,200,0.15,0.31,0.44,0.415,0.415,0.415
hallucination_detection,200,0.14,0.505,0.295,0.31,0.31,0.3
object_counting,200,0.3,0.325,0.505,0.45,0.53,0.51
object_localization,200,0.71,0.03,0.865,0.905,0.85,0.875
object_presence,200,0.815,0.035,0.92,0.91,0.915,0.89
scene_understanding,200,0.72,0.075,0.87,0.815,0.82,0.84
spatial_relationship,200,0.57,0.055,0.82,0.76,0.845,0.78
visual_grounding,200,0.0,1.0,0.0,0.0,0.0,0.0
Average,2000,0.442,0.27,0.601,0.587,0.604,0.595
