category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.295,0.225,0.51,0.565,0.545,0.54
attribute_recognition,200,0.525,0.095,0.755,0.71,0.715,0.74
dynamic_temporal,200,0.155,0.385,0.405,0.41,0.38,0.375
hallucination_detection,200,0.14,0.59,0.31,0.255,0.275,0.25
object_counting,200,0.315,0.365,0.495,0.46,0.475,0.465
object_localization,200,0.41,0.07,0.67,0.705,0.67,0.67
object_presence,200,0.78,0.06,0.86,0.895,0.875,0.885
scene_understanding,200,0.75,0.08,0.885,0.84,0.82,0.835
spatial_relationship,200,0.365,0.125,0.63,0.625,0.69,0.625
visual_grounding,200,0.0,1.0,0.0,0.0,0.0,0.0
Average,2000,0.374,0.3,0.552,0.546,0.544,0.538
