category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.335,0.305,0.51,0.49,0.545,0.52
attribute_recognition,200,0.54,0.18,0.72,0.68,0.685,0.725
dynamic_temporal,200,0.075,0.355,0.355,0.36,0.35,0.345
hallucination_detection,200,0.22,0.42,0.405,0.38,0.39,0.41
object_counting,200,0.36,0.39,0.485,0.505,0.485,0.455
object_localization,200,0.33,0.165,0.555,0.64,0.575,0.58
object_presence,200,0.645,0.055,0.825,0.765,0.83,0.825
scene_understanding,200,0.705,0.09,0.835,0.835,0.805,0.81
spatial_relationship,200,0.15,0.17,0.485,0.5,0.505,0.5
visual_grounding,200,0.0,1.0,0.0,0.0,0.0,0.0
Average,2000,0.336,0.313,0.518,0.516,0.517,0.517
