category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.595,0.265,0.67,0.685,0.655,0.665
attribute_recognition,200,0.68,0.075,0.815,0.825,0.8,0.88
dynamic_temporal,200,0.155,0.225,0.43,0.47,0.43,0.445
hallucination_detection,200,0.56,0.105,0.775,0.76,0.755,0.73
object_counting,200,0.235,0.39,0.405,0.395,0.38,0.41
object_localization,200,0.365,0.045,0.735,0.71,0.72,0.725
object_presence,200,0.695,0.16,0.785,0.765,0.775,0.76
scene_understanding,200,0.84,0.02,0.955,0.925,0.915,0.905
spatial_relationship,200,0.345,0.065,0.685,0.67,0.66,0.645
visual_grounding,200,0.015,0.61,0.115,0.135,0.16,0.115
Average,2000,0.448,0.196,0.637,0.634,0.625,0.628
