category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.415,0.165,0.665,0.66,0.63,0.595
attribute_recognition,200,0.57,0.09,0.74,0.74,0.765,0.77
dynamic_temporal,200,0.145,0.29,0.425,0.425,0.39,0.38
hallucination_detection,200,0.61,0.095,0.79,0.755,0.78,0.745
object_counting,200,0.26,0.37,0.425,0.435,0.42,0.45
object_localization,200,0.18,0.105,0.485,0.56,0.515,0.565
object_presence,200,0.485,0.215,0.62,0.585,0.625,0.665
scene_understanding,200,0.815,0.04,0.9,0.915,0.885,0.9
spatial_relationship,200,0.14,0.095,0.57,0.585,0.545,0.565
visual_grounding,200,0.0,0.81,0.075,0.045,0.065,0.07
Average,2000,0.362,0.228,0.57,0.57,0.562,0.57
