% FO v1 Parsimony Gap Metrics
\begin{table}[t]
  % Top-placed float; the caption is set above the tabular and the label
  % follows the caption so that references resolve to this table.
  \centering
  \caption{FO v1 parsimony gap: validity vs budgeted accuracy.}
  \label{tab:fo_parsimony}
  % \small comes after the caption, so it only shrinks the tabular below.
  \small
  % Columns: one left-aligned model name, then four right-aligned percentages.
  % The @{} at both ends removes the outer column padding.
  \begin{tabular}{@{}lrrrr@{}}
    \toprule
    Model    & Validity        & Acc@+25         & Gap             & Bloat\%         \\
    \midrule
    % Rows are listed in descending Validity. Bold marks the largest Validity
    % and Acc@+25 entries and every 0.0% entry in the Gap and Bloat% columns.
    % NOTE(review): Gap looks like Validity minus Acc@+25; the GPT-5.2 row
    % shows 24.3 where the rounded inputs give 24.2 -- presumably computed
    % from unrounded values, confirm against the source data.
    % NOTE(review): Gap and Bloat% are identical in every row -- confirm that
    % both columns are intended.
    Grok4    & \textbf{50.7\%} & \textbf{46.7\%} & 4.0\%           & 4.0\%           \\
    GPT-5.2  & 43.7\%          & 19.5\%          & 24.3\%          & 24.3\%          \\
    Grok4.1f & 17.9\%          & 17.9\%          & \textbf{0.0\%}  & \textbf{0.0\%}  \\
    Gemini 3 & 16.0\%          & 15.2\%          & 0.8\%           & 0.8\%           \\
    DSR      & 10.4\%          & 10.4\%          & \textbf{0.0\%}  & \textbf{0.0\%}  \\
    Opus 4.5 & 8.5\%           & 8.5\%           & \textbf{0.0\%}  & \textbf{0.0\%}  \\
    Hermes4  & 2.7\%           & 2.7\%           & \textbf{0.0\%}  & \textbf{0.0\%}  \\
    GPT-4o   & 0.0\%           & 0.0\%           & \textbf{0.0\%}  & \textbf{0.0\%}  \\
    \bottomrule
  \end{tabular}
\end{table}