category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.335,0.235,0.58,0.555,0.52,0.57
attribute_recognition,200,0.585,0.09,0.735,0.785,0.735,0.8
dynamic_temporal,200,0.145,0.315,0.435,0.425,0.415,0.43
hallucination_detection,200,0.505,0.185,0.695,0.65,0.66,0.68
object_counting,200,0.145,0.365,0.39,0.35,0.365,0.365
object_localization,200,0.495,0.025,0.74,0.78,0.775,0.795
object_presence,200,0.48,0.18,0.665,0.66,0.665,0.68
scene_understanding,200,0.645,0.075,0.84,0.755,0.785,0.815
spatial_relationship,200,0.32,0.1,0.635,0.66,0.635,0.665
visual_grounding,200,0.035,0.3,0.355,0.27,0.37,0.325
Average,2000,0.369,0.187,0.607,0.589,0.592,0.612
