category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.565,0.165,0.71,0.695,0.72,0.69
attribute_recognition,200,0.74,0.045,0.88,0.855,0.83,0.875
dynamic_temporal,200,0.185,0.245,0.47,0.505,0.42,0.48
hallucination_detection,200,0.525,0.13,0.73,0.7,0.68,0.745
object_counting,200,0.285,0.265,0.525,0.475,0.52,0.45
object_localization,200,0.715,0.015,0.885,0.9,0.915,0.87
object_presence,200,0.81,0.05,0.895,0.91,0.865,0.875
scene_understanding,200,0.92,0.025,0.945,0.945,0.955,0.965
spatial_relationship,200,0.62,0.02,0.825,0.85,0.85,0.855
visual_grounding,200,0.36,0.035,0.69,0.805,0.7,0.785
Average,2000,0.572,0.1,0.756,0.764,0.746,0.759
