category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.52,0.275,0.61,0.63,0.61,0.635
attribute_recognition,200,0.385,0.2,0.555,0.585,0.615,0.645
dynamic_temporal,200,0.105,0.29,0.385,0.38,0.415,0.39
hallucination_detection,200,0.705,0.08,0.805,0.865,0.83,0.83
object_counting,200,0.05,0.535,0.175,0.225,0.255,0.24
object_localization,200,0.01,0.32,0.195,0.26,0.275,0.245
object_presence,200,0.14,0.49,0.28,0.275,0.325,0.335
scene_understanding,200,0.68,0.08,0.825,0.81,0.81,0.805
spatial_relationship,200,0.005,0.345,0.23,0.28,0.2,0.225
visual_grounding,200,0.0,0.9,0.02,0.035,0.035,0.04
Average,2000,0.26,0.352,0.408,0.434,0.437,0.439
