% Training Error Profiles: FP/FN rates (auto-generated)
% Table: per-model training error profiles (FullObs FP/FN, CI YES FP/FN, CI NO margin).
% NOTE(review): the file header marks this table as auto-generated, so hand edits
% are presumably overwritten on regeneration -- mirror layout changes in the generator.
% Requires the booktabs package (\toprule, \cmidrule, \midrule, \bottomrule).
% [htbp] rather than a bare [h]: LaTeX rewrites [h] to [ht] with a warning, and a
% float that fits neither spot can get stuck and drag later floats with it.
\begin{table}[htbp]
\centering
\caption{\textbf{Training error profiles.}
Mean per-world false positive (FP\%) and false negative (FN\%) rates.
For FullObs, rates are averaged across all worlds.
For CI, YES rates are on YES worlds only; NO Margin is mean mismatches
on NO worlds (higher = better separation from NO targets).}
\label{tab:error_profiles}
\small
% Columns: 1 = model name, 2--3 = FullObs rates, 4--6 = CI metrics.
% No vertical rules: booktabs rules are not designed to meet them; the column
% groups are marked by the trimmed \cmidrule lines under the group headers.
\begin{tabular}{@{}lrrrrr@{}}
\toprule
% The final \multicolumn repeats @{} because \multicolumn replaces the column
% spec (including the trailing @{}) for that cell.
 & \multicolumn{2}{c}{FullObs} & \multicolumn{3}{c@{}}{CI} \\
\cmidrule(lr){2-3} \cmidrule(l){4-6}
Model & FP\% & FN\% & YES FP\% & YES FN\% & NO Marg \\
\midrule
% Bold marks the best value per column: lowest for the four rate columns,
% highest for NO Marg (the caption states higher is better).
Grok4 & \textbf{4.3} & \textbf{2.8} & \textbf{0.1} & \textbf{1.0} & 2.6 \\
GPT-5.2 & 11.8 & 6.4 & 3.6 & 2.5 & 3.2 \\
Grok4.1f & 16.4 & 12.1 & 5.1 & 5.0 & 2.7 \\
Gemini 3 & 17.8 & 10.4 & 5.8 & 4.0 & 2.7 \\
DSR & 19.0 & 16.3 & 6.7 & 7.8 & 2.8 \\
Opus 4.5 & 20.1 & 13.8 & 6.5 & 5.3 & 2.8 \\
Hermes4 & 27.7 & 16.5 & 14.2 & 16.4 & 3.7 \\
GPT-4o & 38.2 & 7.4 & 24.2 & 11.9 & \textbf{3.8} \\
\bottomrule
\end{tabular}
\end{table}