category,total_questions,hit_all,miss_all,rot0,rot90,rot180,rot270
attribute_comparison,200,0.26,0.165,0.565,0.525,0.545,0.565
attribute_recognition,200,0.435,0.13,0.65,0.695,0.66,0.705
dynamic_temporal,200,0.14,0.27,0.385,0.45,0.42,0.46
hallucination_detection,200,0.175,0.425,0.395,0.385,0.355,0.355
object_counting,200,0.035,0.32,0.29,0.315,0.31,0.29
object_localization,200,0.035,0.14,0.415,0.36,0.395,0.43
object_presence,200,0.825,0.02,0.91,0.94,0.91,0.93
scene_understanding,200,0.795,0.045,0.905,0.89,0.91,0.885
spatial_relationship,200,0.02,0.235,0.36,0.34,0.325,0.3
visual_grounding,200,0.0,0.855,0.05,0.055,0.035,0.03
Average,2000,0.272,0.26,0.492,0.495,0.487,0.495
