category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.66,0.32,0.675,0.68,0.67,0.665
attribute_recognition,200,0.42,0.18,0.615,0.645,0.625,0.635
dynamic_temporal,200,0.135,0.45,0.325,0.3,0.305,0.32
hallucination_detection,200,0.205,0.54,0.335,0.315,0.335,0.35
object_counting,200,0.06,0.545,0.225,0.215,0.2,0.23
object_localization,200,0.015,0.295,0.265,0.275,0.215,0.325
object_presence,200,0.46,0.24,0.605,0.59,0.615,0.605
scene_understanding,200,0.71,0.12,0.795,0.785,0.8,0.81
spatial_relationship,200,0.005,0.355,0.205,0.24,0.23,0.255
visual_grounding,200,0.005,0.83,0.05,0.09,0.05,0.04
Average,2000,0.268,0.388,0.41,0.414,0.404,0.424
