category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.525,0.19,0.7,0.665,0.68,0.665
attribute_recognition,200,0.68,0.055,0.835,0.815,0.81,0.81
dynamic_temporal,200,0.24,0.16,0.55,0.53,0.535,0.53
hallucination_detection,200,0.405,0.18,0.625,0.61,0.615,0.665
object_counting,200,0.235,0.25,0.48,0.505,0.46,0.465
object_localization,200,0.66,0.04,0.845,0.83,0.825,0.855
object_presence,200,0.725,0.045,0.845,0.85,0.85,0.875
scene_understanding,200,0.915,0.005,0.97,0.955,0.955,0.965
spatial_relationship,200,0.6,0.02,0.815,0.825,0.84,0.78
visual_grounding,200,0.215,0.08,0.54,0.63,0.595,0.655
Average,2000,0.52,0.102,0.72,0.722,0.716,0.726
