category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.345,0.25,0.56,0.54,0.555,0.55
attribute_recognition,200,0.555,0.11,0.73,0.7,0.74,0.765
dynamic_temporal,200,0.155,0.27,0.46,0.425,0.44,0.445
hallucination_detection,200,0.35,0.34,0.48,0.495,0.52,0.485
object_counting,200,0.175,0.27,0.47,0.425,0.42,0.49
object_localization,200,0.525,0.05,0.77,0.805,0.78,0.77
object_presence,200,0.695,0.03,0.835,0.845,0.855,0.875
scene_understanding,200,0.695,0.055,0.865,0.82,0.83,0.805
spatial_relationship,200,0.34,0.065,0.645,0.655,0.73,0.655
visual_grounding,200,0.0,1.0,0.0,0.0,0.0,0.0
Average,2000,0.384,0.244,0.581,0.571,0.587,0.584
