category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.54,0.155,0.7,0.68,0.755,0.685
attribute_recognition,200,0.7,0.085,0.82,0.825,0.82,0.82
dynamic_temporal,200,0.21,0.21,0.46,0.495,0.47,0.5
hallucination_detection,200,0.185,0.43,0.36,0.395,0.39,0.405
object_counting,200,0.215,0.225,0.48,0.54,0.46,0.455
object_localization,200,0.575,0.02,0.865,0.835,0.795,0.81
object_presence,200,0.865,0.03,0.925,0.925,0.895,0.93
scene_understanding,200,0.92,0.03,0.955,0.95,0.95,0.94
spatial_relationship,200,0.855,0.025,0.94,0.92,0.94,0.935
visual_grounding,200,0.03,0.57,0.195,0.155,0.215,0.18
Average,2000,0.509,0.178,0.67,0.672,0.669,0.666
