% Table: LDP label accuracy on the causally insufficient linear--Gaussian DAGs,
% with one column group per panel of the latent-experiments figure.
% Placement: LaTeX rewrites a lone [!h] to [!ht] with a warning, so the
% fallback positions are listed explicitly.
\begin{table}[!htbp]
    \centering
    % Shrink the tabular only if it would otherwise exceed the text width.
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l c c c c c c}
    \toprule
    & \multicolumn{3}{c}{\textsc{Figure~\ref{fig:latent_experiments} (left)}} & \multicolumn{3}{c}{\textsc{Figure~\ref{fig:latent_experiments} (right)}} \\
    % Group rules under the two spanning headers. The column ranges must be
    % written with an ASCII hyphen; an en-dash here is not a valid range.
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    \textsc{Latent Confounder} & None & $Z_{5a}$ & $Z_{4a}$ & None & $Z_{5b}$ & $Z_{4b}$ \\
    \midrule
    % Each entry: accuracy, followed by its confidence interval in parentheses.
    \textsc{Label Accuracy} & 98.2 (97.7--98.7) & 100 (100--100) & 100 (100--100) & 100 (100--100) & 100 (100--100) & 100 (100--100) \\
    \bottomrule
    \end{tabular}
    \end{adjustbox}
    % One sentence per source line; single newlines are ordinary spaces.
    \caption{Performance of LDP for causally insufficient linear--Gaussian DAGs (Figure~\ref{fig:latent_experiments}) with pretreatment $\z$ numerically validates Theorem~\ref{theorem:pretreatment_latents}.
    Label accuracy is computed with the expected label for LDP under causal sufficiency as the ground truth.
    This is to accommodate the fact that LDP is \emph{expected} to mislabel $Z_{1a}$ and $Z_{1c}$ as $\z_{\textsc{Post}}$ even when there are no latent variables in $\g$, though the returned $\z_1$ ($\{Z_{1b}\}$) is still expected to be a valid adjustment set.
    All other variables in Figure~\ref{fig:latent_experiments} are expected to have correct partition labels.
    Accuracies are averaged over 100 replicate DAGs with identical structure and varying coefficients, with structural equations reported in Table~\ref{tab:sem_continuous}.
    The 95\% confidence intervals are reported in parentheses.
    Independence is determined by Fisher-z tests ($\alpha = 0.005$).
    All experiments were run on a 2017 MacBook with 2.9~GHz Quad-Core Intel Core i7.}
    \label{tab:latent_pretreatment}
\end{table}