category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.42,0.17,0.645,0.645,0.645,0.645
attribute_recognition,200,0.595,0.09,0.735,0.765,0.755,0.79
dynamic_temporal,200,0.135,0.365,0.39,0.385,0.38,0.365
hallucination_detection,200,0.365,0.335,0.525,0.49,0.51,0.55
object_counting,200,0.285,0.425,0.44,0.45,0.43,0.42
object_localization,200,0.27,0.195,0.53,0.55,0.535,0.52
object_presence,200,0.615,0.13,0.75,0.72,0.75,0.775
scene_understanding,200,0.855,0.025,0.94,0.9,0.92,0.93
spatial_relationship,200,0.14,0.075,0.53,0.58,0.5,0.525
visual_grounding,200,0.0,1.0,0.0,0.0,0.0,0.0
Average,2000,0.368,0.281,0.548,0.548,0.542,0.552
