category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.390,0.210,0.575,0.635,0.605,0.630
attribute_recognition,200,0.455,0.105,0.660,0.705,0.715,0.765
dynamic_temporal,200,0.105,0.310,0.400,0.400,0.420,0.395
hallucination_detection,200,0.530,0.120,0.725,0.705,0.740,0.750
object_counting,200,0.120,0.340,0.380,0.375,0.335,0.325
object_localization,200,0.330,0.080,0.620,0.630,0.660,0.655
object_presence,200,0.305,0.240,0.535,0.510,0.545,0.550
scene_understanding,200,0.580,0.075,0.825,0.755,0.770,0.760
spatial_relationship,200,0.205,0.075,0.610,0.570,0.580,0.610
visual_grounding,200,0.080,0.260,0.355,0.315,0.410,0.360
Average,2000,0.310,0.181,0.569,0.560,0.578,0.580
