% Results table for the M-structure experiments (label tab:results_m).
% Layout: five stacked panels (all variables observed; M_1, M_2, M_3
% unobserved; M_1 and M_2 unobserved). Each panel has two column groups
% (Bernoulli | Linear and Hypergeometric | Quadratic) with accuracy,
% precision and recall per sample size n; the parenthesised range is the
% 95% confidence interval described in the caption.
% Panels are separated by \midrule[\heavyrulewidth] rather than a repeated
% \toprule: \toprule has no space above it by default, which crowds the last
% data row of the preceding panel. Column headers are closed with \midrule
% instead of \hline so that all rules use booktabs spacing.
\begin{table}[!htbp]
    \centering
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l ccc ccc}
    \toprule
%%%%%%%%%%%%%%%%%%%%%
%% All observed
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{All Variables Observed}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    \midrule
$500$ & 73.5 (71.0-76.0) & 26.2 (17.6-34.9) & 27.0 (18.3-35.7) & 75.3 (73.8-76.8) & 16.0 (8.8-23.2) & 16.0 (8.8-23.2) \\
$1k$ & 92.1 (90.4-93.8) & 90.0 (84.1-95.9) & 90.0 (84.1-95.9) & 87.3 (85.8-88.7) & 94.0 (89.3-98.7) & 94.0 (89.3-98.7) \\
$5k$ & 97.1 (96.0-98.2) & 97.0 (93.6-100) & 97.0 (93.6-100) & 99.8 (99.6-100) & 100 (100-100) & 100 (100-100) \\
$10k$ & 99.7 (99.4-100) & 100 (100-100) & 100 (100-100) & 100 (100-100) & 100 (100-100) & 100 (100-100) \\
%%%%%%%%%%%%%%%%%%%
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% M1 dropped
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$M_1$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    \midrule
$500$ & 69.2 (66.4-72.0) & 17.0 (9.6-24.4) & 17.0 (9.6-24.4) & 72.8 (71.3-74.3) & 13.0 (6.4-19.6) & 13.0 (6.4-19.6) \\
$1k$ & 92.4 (90.5-94.3) & 69.0 (59.9-78.1) & 69.0 (59.9-78.1) & 90.4 (88.8-92.0) & 83.0 (75.6-90.4) & 83.0 (75.6-90.4) \\
$5k$ & 96.0 (94.4-97.6) & 80.0 (72.1-87.9) & 80.0 (72.1-87.9) & 100 (100-100) & 100 (100-100) & 100 (100-100) \\
$10k$ & 99.8 (99.4-100) & 99.0 (97.0-100) & 99.0 (97.0-100) & 99.8 (99.4-100) & 99.0 (97.0-100) & 99.0 (97.0-100) \\
%%%%%%%%%%%%%%%%%%%
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% M2 dropped
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$M_2$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    \midrule
$500$ & 57.4 (53.5-61.3) & 27.0 (18.3-35.7) & 27.0 (18.3-35.7) & 76.8 (74.5-79.1) & 37.0 (27.6-46.4) & 39.0 (29.4-48.6) \\
$1k$ & 84.6 (83.3-85.9) & 92.8 (87.9-97.7) & 94.0 (89.3-98.7) & 87.8 (86.3-89.3) & 98.0 (95.2-100) & 98.0 (95.2-100) \\
$5k$ & 78.1 (77.0-79.2) & 30.3 (28.5-32.2) & 91.0 (85.4-96.6) & 79.8 (79.5-80.1) & 34.0 (33.4-34.6) & 100 (100-100) \\
$10k$ & 80.0 (80.0-80.0) & 33.3 (33.3-33.3) & 100 (100-100) & 80.0 (80.0-80.0) & 33.3 (33.3-33.3) & 100 (100-100) \\
%%%%%%%%%%%%%%%%%%%
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% M3 dropped
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$M_3$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    \midrule
$500$ & 78.1 (75.9-80.3) & 19.0 (11.3-26.7) & 19.0 (11.3-26.7) & 82.0 (80.7-83.3) & 11.0 (4.8-17.2) & 11.0 (4.8-17.2) \\
$1k$ & 94.2 (92.8-95.6) & 96.0 (92.1-99.9) & 96.0 (92.1-99.9) & 91.1 (89.3-92.9) & 86.0 (79.2-92.8) & 86.0 (79.2-92.8) \\
$5k$ & 97.7 (96.7-98.7) & 99.0 (97.0-100) & 99.0 (97.0-100) & 99.9 (99.7-100) & 100 (100-100) & 100 (100-100) \\
$10k$ & 99.9 (99.7-100) & 99.5 (98.5-100) & 100 (100-100) & 99.7 (99.4-100) & 100 (100-100) & 100 (100-100) \\
%%%%%%%%%%%%%%%%%%%
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% M1 and M2 dropped
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$M_1$ and $M_2$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    \midrule
$500$ & 65.8 (61.9-69.7) & 23.0 (14.7-31.3) & 23.0 (14.7-31.3) & 74.6 (72.3-76.8) & 35.0 (25.6-44.4) & 35.0 (25.6-44.4) \\
$1k$ & 91.9 (89.9-93.8) & 70.5 (61.9-79.1) & 74.0 (65.4-82.6) & 89.1 (87.4-90.9) & 90.0 (84.1-95.9) & 90.0 (84.1-95.9) \\
$5k$ & 66.7 (66.7-66.7) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) & 66.7 (66.7-66.7) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) \\
$10k$ & 66.7 (66.7-66.7) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) & 66.9 (66.2-67.6) & 1.0 (0-3.0) & 1.0 (0-3.0) \\
    %%%%%%%%%%%%%%%%%%%
    \bottomrule
    \end{tabular}
    \end{adjustbox}
    \caption{Performance of Algorithm~\ref{alg:method} on thirteen-node DAGs containing an M-structure (Figure~\ref{fig:m_butterfly}) across noise distributions, causal mechanisms, and sample sizes ($n$). In all DAGs, exposure $X$ is a direct cause of outcome $Y$. Metrics reported are accuracy of all labels ($\z$ \textsc{Acc}), mean precision for partition $\z_1$ ($\z_1$ \textsc{Prec}), and mean recall for partition $\z_1$ ($\z_1$ \textsc{Rec}). The 95\% confidence interval over the 100 individual DAG metrics is reported in parentheses. Independence was determined by chi-square independence testing with $\alpha = 0.001$.}
    \label{tab:results_m}
\end{table}


% Results table for the butterfly-structure experiments
% (label tab:results_butterfly).
% Layout: four stacked panels (all variables observed; B_1, B_2, B_3
% unobserved). Each panel has two column groups (Bernoulli | Linear and
% Hypergeometric | Quadratic) with accuracy, precision and recall per sample
% size n; the parenthesised range is the 95% confidence interval described in
% the caption.
% Panels are separated by \midrule[\heavyrulewidth] rather than a repeated
% \toprule: \toprule has no space above it by default, which crowds the last
% data row of the preceding panel. Column headers are closed with \midrule
% instead of \hline so that all rules use booktabs spacing.
% NOTE(review): the "x" cells in the Hypergeometric | Quadratic columns of the
% B_1/B_2/B_3 panels look like placeholders for results not yet filled in --
% confirm before publication.
% NOTE(review): only the B_3 panel has a $25k$ row -- confirm this is intended.
\begin{table}[!htbp]
    \centering
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l ccc ccc}
    \toprule
%%%%%%%%%%%%%%%%%%%%%
%% All observed
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{All Variables Observed}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    %%%
    \midrule
$1k$ & 60.4 (57.5-63.2) & 16.8 (9.6-24.0) & 12.5 (6.6-18.4) & 61.5 (58.9-64.0) & 28.9 (20.1-37.7) & 16.0 (10.3-21.7) \\
$2.5k$ & 98.8 (97.1-100) & 98.0 (95.2-100) & 98.0 (95.2-100) & 99.9 (99.7-100) & 100 (100-100) & 100 (100-100) \\
$5k$ & 98.9 (97.4-100) & 99.0 (97.0-100) & 98.2 (95.8-100) & 99.9 (99.7-100) & 100 (100-100) & 100 (100-100) \\
$10k$ & 99.7 (99.4-100) & 100 (100-100) & 99.2 (98.4-100) & 99.8 (99.5-100) & 100 (100-100) & 99.5 (98.5-100) \\
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% B1 unobserved
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$B_1$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    %%%
    \midrule
$1k$ & 71.3 (68.3-74.3) & 36.0 (27.7-44.3) & 32.0 (24.5-39.5) & x & x & x \\
$2.5k$ & 100 (100-100) & 100 (100-100) & 100 (100-100) & x & x & x \\
$5k$ & 99.1 (98.0-100) & 98.0 (95.2-100) & 97.7 (94.8-100) & x & x & x \\
$10k$ & 99.9 (99.7-100) & 100 (100-100) & 99.7 (99.0-100) & x & x & x \\
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% B2 unobserved
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$B_2$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    %%%
    \midrule
$1k$ & 72.0 (68.9-75.1) & 38.2 (29.9-46.5) & 35.0 (27.4-42.6) & x & x & x \\
$2.5k$ & 99.2 (97.8-100) & 99.0 (97.0-100) & 99.0 (97.0-100) & x & x & x \\
$5k$ & 100 (100-100) & 100 (100-100) & 100 (100-100) & x & x & x \\
$10k$ & 99.5 (98.7-100) & 99.0 (97.0-100) & 99.0 (97.0-100) & x & x & x \\
    \midrule[\heavyrulewidth]
%%%%%%%%%%%%%%%%%%%%%
%% B3 unobserved
%%%%%%%%%%%%%%%%%%%%%
    & \multicolumn{6}{c}{\fontfamily{cmr}\textsc{\textbf{$B_3$ Unobserved}}} \\
    \cmidrule(lr){2-7}
    %%%
    & \multicolumn{3}{c}{\textsc{Bernoulli $|$ Linear}} & \multicolumn{3}{c}{\textsc{Hypergeometric $|$ Quadratic}} \\
    \cmidrule(lr){2-4} \cmidrule(lr){5-7}
    %%%
$n$ & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} & \textsc{$\z$ Acc} & \textsc{$\z_1$ Prec} & \textsc{$\z_1$ Rec} \\
    %%%
    \midrule
$1k$ & 68.8 (67.7-69.9) & 46.5 (44.0-49.0) & 31.0 (29.3-32.7) & x & x & x \\
$2.5k$ & 71.0 (70.4-71.6) & 51.7 (50.7-52.7) & 36.7 (34.7-38.6) & x & x & x \\
$5k$ & 77.2 (76.3-78.1) & 62.3 (60.9-63.8) & 58.0 (55.1-60.9) & x & x & x \\
$10k$ & 80.0 (80.0-80.0) & 66.7 (66.7-66.7) & 66.7 (66.7-66.7) & x & x & x \\
$25k$ & 79.9 (79.7-80.1) & 66.7 (66.7-66.7) & 66.7 (66.7-66.7) & x & x & x \\
    %%%%%%%%%%%%%%%%%%%
    \bottomrule
    \end{tabular}
    \end{adjustbox}
    \caption{Performance of Algorithm~\ref{alg:method} on thirteen-node DAGs containing a butterfly structure (Figure~\ref{fig:m_butterfly}) across noise distributions, causal mechanisms, and sample sizes ($n$). In all DAGs, exposure $X$ is a direct cause of outcome $Y$. Metrics reported are accuracy of all labels ($\z$ \textsc{Acc}), mean precision for partition $\z_1$ ($\z_1$ \textsc{Prec}), and mean recall for partition $\z_1$ ($\z_1$ \textsc{Rec}). The 95\% confidence interval over the 100 individual DAG metrics is reported in parentheses. Independence was determined by chi-square independence testing with $\alpha = 0.001$.} %{\color{red} Butterfly manual threshold = 0.01, 0.0075 for linear-hypergeometric}}
    \label{tab:results_butterfly}
\end{table}