 & Triangle & Quadrilateral & Length & Angle & Area & Diameter & Shape (s) & Shape (m) & Extraction & Intersection &  \\
\midrule
Phi-3.5-vision & \textcolor{red}{-2.0} & \textcolor{red}{-1.0} & \textcolor{teal}{8.0} & \textcolor{teal}{4.0} & \textcolor{red}{-3.0} & \textcolor{teal}{18.0} & \textcolor{red}{-2.0} & \textcolor{teal}{2.0} & \textcolor{teal}{6.0} & \textcolor{teal}{1.0} & \textcolor{teal}{3.4} \\
LLaVA-Next 8B & \textcolor{teal}{4.0} & \textcolor{teal}{2.0} & \textcolor{teal}{9.0} & \textcolor{teal}{1.0} & \textcolor{red}{-7.0} & \textcolor{red}{-1.0} & \textcolor{red}{-2.0} & \textcolor{teal}{14.0} & \textcolor{teal}{2.0} & \textcolor{gray}{0.0} & \textcolor{teal}{1.8} \\
LLaVA-Next 34B & \textcolor{teal}{3.0} & \textcolor{teal}{1.0} & \textcolor{red}{-7.0} & \textcolor{teal}{5.0} & \textcolor{red}{-3.0} & \textcolor{gray}{0.0} & \textcolor{teal}{4.0} & \textcolor{teal}{2.0} & \textcolor{red}{-1.0} & \textcolor{teal}{3.0} & \textcolor{teal}{0.4} \\
Llama 3.2 11B & \textcolor{gray}{0.0} & \textcolor{red}{-6.0} & \textcolor{teal}{3.0} & \textcolor{teal}{6.0} & \textcolor{red}{-6.0} & \textcolor{teal}{3.0} & \textcolor{teal}{8.0} & \textcolor{teal}{8.0} & \textcolor{teal}{9.0} & \textcolor{red}{-3.0} & \textcolor{teal}{1.6} \\
Llama 3.2 90B & \textcolor{red}{-11.0} & \textcolor{teal}{2.0} & \textcolor{teal}{8.0} & \textcolor{teal}{2.0} & \textcolor{teal}{5.0} & \textcolor{teal}{6.0} & \textcolor{teal}{2.0} & \textcolor{teal}{8.0} & \textcolor{teal}{15.0} & \textcolor{teal}{5.0} & \textcolor{teal}{4.1} \\
MolMo 7B-D & \textcolor{gray}{0.0} & \textcolor{teal}{1.0} & \textcolor{teal}{3.0} & \textcolor{teal}{8.0} & \textcolor{teal}{3.0} & \textcolor{red}{-3.0} & \textcolor{red}{-6.0} & \textcolor{teal}{10.0} & \textcolor{red}{-3.0} & \textcolor{teal}{5.0} & \textcolor{teal}{1.8} \\
MolMo 72B & \textcolor{red}{-1.0} & \textcolor{red}{-1.0} & \textcolor{teal}{2.0} & \textcolor{teal}{2.0} & \textcolor{teal}{11.0} & \textcolor{teal}{1.0} & \textcolor{red}{-10.0} & \textcolor{teal}{4.0} & \textcolor{red}{-11.0} & \textcolor{gray}{0.0} & \textcolor{gray}{0.0} \\
Qwen2-VL-2B & \textcolor{gray}{0.0} & \textcolor{gray}{0.0} & \textcolor{red}{-2.0} & \textcolor{gray}{0.0} & \textcolor{teal}{4.0} & \textcolor{gray}{0.0} & \textcolor{red}{-6.0} & \textcolor{red}{-4.0} & \textcolor{red}{-4.0} & \textcolor{teal}{3.0} & \textcolor{red}{-0.4} \\
Qwen2-VL-7B & \textcolor{red}{-1.0} & \textcolor{teal}{2.0} & \textcolor{teal}{3.0} & \textcolor{teal}{2.0} & \textcolor{red}{-5.0} & \textcolor{teal}{2.0} & \textcolor{red}{-4.0} & \textcolor{red}{-4.0} & \textcolor{teal}{3.0} & \textcolor{teal}{1.0} & \textcolor{teal}{0.3} \\
Qwen2-VL-72B & \textcolor{teal}{3.0} & \textcolor{red}{-2.0} & \textcolor{teal}{5.0} & \textcolor{red}{-2.0} & \textcolor{teal}{5.0} & \textcolor{teal}{1.0} & \textcolor{teal}{20.0} & \textcolor{teal}{2.0} & \textcolor{red}{-5.0} & \textcolor{teal}{3.0} & \textcolor{teal}{2.1} \\
InternVL2-4B & \textcolor{red}{-2.0} & \textcolor{red}{-13.0} & \textcolor{red}{-8.0} & \textcolor{teal}{6.0} & \textcolor{teal}{5.0} & \textcolor{gray}{0.0} & \textcolor{teal}{6.0} & \textcolor{red}{-2.0} & \textcolor{red}{-1.0} & \textcolor{teal}{4.0} & \textcolor{red}{-0.8} \\
InternVL2-8B & \textcolor{gray}{0.0} & \textcolor{teal}{7.0} & \textcolor{red}{-3.0} & \textcolor{red}{-10.0} & \textcolor{teal}{2.0} & \textcolor{teal}{6.0} & \textcolor{teal}{2.0} & \textcolor{red}{-2.0} & \textcolor{teal}{2.0} & \textcolor{gray}{0.0} & \textcolor{teal}{0.4} \\
InternVL2-26B & \textcolor{red}{-2.0} & \textcolor{teal}{3.0} & \textcolor{teal}{3.0} & \textcolor{teal}{1.0} & \textcolor{teal}{10.0} & \textcolor{red}{-3.0} & \textcolor{teal}{2.0} & \textcolor{teal}{2.0} & \textcolor{teal}{10.0} & \textcolor{teal}{3.0} & \textcolor{teal}{3.0} \\
InternVL2-40B & \textcolor{teal}{7.0} & \textcolor{red}{-1.0} & \textcolor{teal}{1.0} & \textcolor{teal}{1.0} & \textcolor{teal}{11.0} & \textcolor{teal}{3.0} & \textcolor{teal}{18.0} & \textcolor{teal}{8.0} & \textcolor{red}{-6.0} & \textcolor{red}{-3.0} & \textcolor{teal}{2.9} \\
InternVL2-76B & \textcolor{teal}{3.0} & \textcolor{teal}{2.0} & \textcolor{red}{-1.0} & \textcolor{red}{-7.0} & \textcolor{teal}{1.0} & \textcolor{gray}{0.0} & \textcolor{red}{-6.0} & \textcolor{red}{-2.0} & \textcolor{red}{-5.0} & \textcolor{red}{-2.0} & \textcolor{red}{-1.4} \\
\midrule
Claude 3.5 Sonnet & \textcolor{teal}{4.0} & \textcolor{teal}{3.0} & \textcolor{teal}{5.0} & \textcolor{teal}{4.0} & \textcolor{red}{-2.0} & \textcolor{red}{-5.0} & \textcolor{teal}{32.0} & \textcolor{teal}{2.0} & \textcolor{teal}{20.0} & \textcolor{teal}{10.0} & \textcolor{teal}{6.2} \\
GPT-4o-mini & \textcolor{teal}{3.0} & \textcolor{red}{-2.0} & \textcolor{teal}{3.0} & \textcolor{red}{-2.0} & \textcolor{teal}{3.0} & \textcolor{teal}{4.0} & \textcolor{teal}{14.0} & \textcolor{teal}{6.0} & \textcolor{red}{-9.0} & \textcolor{gray}{0.0} & \textcolor{teal}{1.1} \\
GPT-4o & \textcolor{red}{-3.0} & \textcolor{teal}{1.0} & \textcolor{teal}{3.0} & \textcolor{red}{-8.0} & \textcolor{teal}{4.0} & \textcolor{teal}{1.0} & \textcolor{teal}{10.0} & \textcolor{teal}{4.0} & \textcolor{teal}{5.0} & \textcolor{red}{-1.0} & \textcolor{teal}{1.0} \\
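% NOTE(review): last column changed from \textcolor{red}{-0.8} to 2.1 so that it matches the per-task cells of this row (same weighting as every other row: Shape (s)/(m) count half); if -0.8 was correct, the per-task cells are wrong instead -- verify against raw results.
Gemini 1.5 Flash & \textcolor{teal}{3.0} & \textcolor{red}{-5.0} & \textcolor{teal}{1.0} & \textcolor{red}{-1.0} & \textcolor{red}{-1.0} & \textcolor{teal}{7.0} & \textcolor{teal}{4.0} & \textcolor{gray}{0.0} & \textcolor{teal}{7.0} & \textcolor{teal}{6.0} & \textcolor{teal}{2.1} \\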
Gemini 1.5 Pro & \textcolor{gray}{0.0} & \textcolor{teal}{8.0} & \textcolor{teal}{2.0} & \textcolor{red}{-6.0} & \textcolor{red}{-5.0} & \textcolor{teal}{2.0} & \textcolor{teal}{10.0} & \textcolor{teal}{4.0} & \textcolor{teal}{5.0} & \textcolor{teal}{3.0} & \textcolor{teal}{1.8} \\
