category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.55,0.13,0.74,0.685,0.745,0.685
attribute_recognition,200,0.72,0.055,0.83,0.83,0.84,0.85
dynamic_temporal,200,0.28,0.075,0.615,0.615,0.615,0.575
hallucination_detection,200,0.56,0.09,0.755,0.77,0.745,0.755
object_counting,200,0.215,0.22,0.45,0.47,0.49,0.51
object_localization,200,0.78,0.035,0.895,0.895,0.89,0.885
object_presence,200,0.565,0.125,0.735,0.725,0.72,0.74
scene_understanding,200,0.92,0.005,0.975,0.96,0.96,0.965
spatial_relationship,200,0.77,0.01,0.93,0.895,0.92,0.89
visual_grounding,200,0.13,0.22,0.4,0.375,0.43,0.505
Average,2000,0.549,0.096,0.732,0.722,0.735,0.736
