% EC Best-Completion Analysis (auto-generated)
% Shows how close invalid predictions are to being valid
% Table float: EC best-completion error analysis, one row per model.
% Needs the booktabs package for \toprule, \midrule and \bottomrule.
% NOTE(review): the file header marks this file as auto-generated, so any
% change made here presumably has to be mirrored in the generator -- confirm.
%
% Placement is [htbp] instead of a bare [h]: LaTeX rewrites [h] to [ht] with a
% warning and may defer the float to the end when it does not fit "here".
\begin{table}[htbp]
  \centering
  \caption{\textbf{EC best-completion error analysis.}
    For predictions that fail the exists-completion (EC) validity check,
    we compute the \emph{minimum mismatches} achievable under any completion
    of unknown atoms.
    A formula whose minimum mismatch count is~0 would be EC-valid;
    higher values indicate how far the formula is from validity.
    Mean MM = mean minimum mismatches for invalid predictions.
    Distribution columns show the fraction of invalid predictions in each
    mismatch range.}
  \label{tab:ec_best_completion}
  \small
  % Columns: model name (left-aligned), then five right-aligned columns.
  % The percentage in "Valid" equals Valid/Total rounded to a whole percent.
  % The two distribution columns (1--2 and >=3) sum to 100% in every row.
  % Bold marks the per-column extreme: highest Valid count and 1--2 share,
  % lowest Mean MM and >=3 share.
  \begin{tabular}{@{}lrrrrr@{}}
    \toprule
    Model    & Total & Valid               & Mean MM      & 1--2          & $\geq$3       \\
    \midrule
    GPT-5.2  & 200   & \textbf{156} (78\%) & 6.2          & 19\%          & 81\%          \\
    Gemini 3 & 200   & 107 (54\%)          & \textbf{4.2} & \textbf{34\%} & \textbf{66\%} \\
    Grok4    & 199   & 106 (53\%)          & 6.0          & 20\%          & 80\%          \\
    Grok4.1f & 200   & 82 (41\%)           & 5.5          & 19\%          & 81\%          \\
    DSR      & 200   & 66 (33\%)           & 5.6          & 14\%          & 86\%          \\
    Opus 4.5 & 200   & 60 (30\%)           & 6.5          & 8\%           & 92\%          \\
    Hermes4  & 200   & 31 (16\%)           & 6.5          & 13\%          & 87\%          \\
    GPT-4o   & 200   & 4 (2\%)             & 8.4          & 3\%           & 97\%          \\
    \bottomrule
  \end{tabular}
\end{table}