% Column type `a': a centred (`c') column whose cells get a light
% Dandelion background (`Dandelion!15', i.e. a 15% tint).  The table below
% uses it for the first column of each four-column method group.
% NOTE(review): presumably relies on array + colortbl and on xcolor being
% loaded with the dvipsnames colours -- confirm against the preamble.
\newcolumntype{a}{%
  >{\columncolor{Dandelion!15}}%
  c%
}

\begin{table}[!h]
    \centering
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l accc accc accc}
    \toprule[1pt]
        & \multicolumn{12}{c}{\Large \fontfamily{cmr}\textsc{\textbf{Common Cause Criterion}}} \\
        %%%
         \cmidrule(lr){2-13} 
         %%%%
         & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Valid Adjustment Set}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Average Treatment Effect (ATE)}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{ATE Mean Squared Error}}} \\
         %%%%
         \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13} 
         %%%%
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
        %%%
        \hline
        $1k$ & \textbf{0.93} & 0.00 & 0.03 & 0.10 & \textbf{3.77 (3.75-3.79)} & 3.58 (3.38-3.77) & 3.88 (3.71-4.05) & 3.97 (3.86-4.08) & \textbf{0.0096} & 1.0509 & 0.7817 & 0.3703 \\
        $2.5k$ & \textbf{0.96} & 0.00 & 0.02 & 0.30 & \textbf{3.76 (3.75-3.78)} & 2.5 (2.14-2.87) & 4.08 (4.07-4.09) & 3.97 (3.93-4.01) & \textbf{0.0053} & 4.9982 & 0.1088 & 0.0817 \\
        $5k$ & \textbf{0.96} & 0.03 & 0.04 & 0.60 & \textbf{3.76 (3.75-3.77)} & 1.09 (0.78-1.4) & 4.07 (4.05-4.08) & 3.87 (3.83-3.9) & \textbf{0.0046} & 9.5287 & 0.1054 & 0.0473 \\
        $7.5k$ & \textbf{0.97} & 0.11 & 0.14 & 0.73 & \textbf{3.76 (3.75-3.77)} & 1 (0.72-1.27) & 4.04 (4.01-4.06) & 3.83 (3.8-3.86) & \textbf{0.0037} & 9.5009 & 0.0950 & 0.0325 \\
        %%%%%%%%%%%%
        %%%%%%%%%%%%
        %%%%%%%%%%%%
        \midrule[0.5pt]
        %%%%
         & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Precision}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Recall}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Adjustment Set Cardinality}}} \\
         %%%%
         \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13} 
         %%%%
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
        \hline
        $1k$ & \textbf{93 (87.97-98.03)} & 13.17 (8.88-17.45) & 3 (0-6.36) & 10 (4.09-15.91) & \textbf{93 (87.97-98.03)} & 27 (18.25-35.75) & 3 (0-6.36) & 10 (4.09-15.91) & \textbf{0.9 (0.9-1)} & 0.6 (0.4-0.7) & 0.1 (0-0.1) & 0.1 (0.1-0.2) \\
        $2.5k$ & \textbf{96 (92.14-99.86)} & 16.83 (12.34-21.32) & 2 (0-4.76) & 30 (20.97-39.03) & \textbf{96 (92.14-99.86)} & 36 (26.54-45.46) & 2 (0-4.76) & 30 (20.97-39.03) & \textbf{1 (0.9-1)} & 1 (0.8-1.2) & 0 (0-0) & 0.3 (0.2-0.4) \\
        $5k$ & \textbf{96 (92.14-99.86)} & 27.33 (23.19-31.48) & 4 (0.14-7.86) & 60 (50.35-69.65) & \textbf{96 (92.14-99.86)} & 70 (60.97-79.03) & 4 (0.14-7.86) & 60 (50.35-69.65) & \textbf{1 (0.9-1)} & 2.2 (2-2.4) & 0 (0-0.1) & 0.6 (0.5-0.7) \\
        $7.5k$ & \textbf{97 (93.64-100)} & 34.08 (30.81-37.36) & 14 (7.16-20.84) & 73 (64.25-81.75) & \textbf{97 (93.64-100)} & 90 (84.09-95.91) & 14 (7.16-20.84) & 73 (64.25-81.75) & \textbf{1 (0.9-1)} & 2.7 (2.5-2.9) & 0.1 (0.1-0.2) & 0.7 (0.7-0.8) \\
    \midrule[1pt]
    %%%%%%%%%%%%
    %%%%%%%%%%%%
    %%%%%%%%%%%%
    %\toprule[1pt]
    & \multicolumn{12}{c}{\Large \fontfamily{cmr}\textsc{\textbf{Disjunctive Cause Criterion}}} \\
        %%%
         \cmidrule(lr){2-13} 
         %%%%
         & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Valid Adjustment Set}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Average Treatment Effect (ATE)}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{ATE Mean Squared Error}}} \\
         %%%%
         \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13} 
         %%%%
            $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
            %%%
            \hline
            $1k$ & \textbf{0.93} & 0.00 & 0.09 & 0.02 & \textbf{3.77 (3.76-3.79)} & 0.87 (0.6-1.14) & 1.41 (1.15-1.67) & 1.05 (0.77-1.34) & \textbf{0.0091} & 10.2090 & 7.1930 & 9.3487 \\
            $2.5k$ & \textbf{0.96} & 0.00 & 0.11 & 0.08 & \textbf{3.76 (3.75-3.78)} & 0.28 (0.23-0.33) & 1.31 (1.11-1.51) & 1.34 (1.07-1.61) & \textbf{0.0055} & 12.0875 & 6.9627 & 7.6885 \\
            $5k$ & \textbf{0.96} & 0.00 & 0.14 & 0.32 & \textbf{3.76 (3.75-3.78)} & 0.4 (0.29-0.52) & 2.09 (1.79-2.38) & 2.34 (2.07-2.62) & \textbf{0.0050} & 11.5372 & 5.0590 & 3.9600 \\
            $7.5k$ & \textbf{0.97} & 0.03 & 0.31 & 0.48 & \textbf{3.76 (3.75-3.77)} & 0.6 (0.43-0.77) & 2.52 (2.22-2.81) & 2.75 (2.49-3.01) & \textbf{0.0037} & 10.6568 & 3.8045 & 2.7495 \\
        %%%%%%%%%
        %%%%%%%%%
        %%%%%%%%%
        \midrule[0.5pt]
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Precision}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Recall}}} & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Adjustment Set Cardinality}}} \\
         %%%%
         \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13} 
         %%%%
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
        \hline
        %%%
        $1k$ & \textbf{31.83 (29.97-33.7)} & 27.08 (24.77-29.4) & 23.4 (19.08-27.72) & 30.83 (27.95-33.72) & \textbf{93 (87.97-98.03)} & 85 (77.97-92.03) & 61 (51.39-70.61) & 87 (80.38-93.62) & \textbf{2.8 (2.7-2.9)} & 2.7 (2.5-2.9) & 2.4 (2.2-2.6) & 2.6 (2.3-2.8) \\
        $2.5k$ & 32.33 (30.95-33.71) & 30.43 (29.51-31.36) & 17.83 (11.86-23.8) & \textbf{40.33 (37.88-42.79)} & 96 (92.14-99.86) & 100 (100-100) & 31 (21.89-40.11) & \textbf{99 (97.04-100)} & \textbf{2.9 (2.8-3)} & 3.4 (3.3-3.5) & 1.5 (1.4-1.7) & 2.6 (2.5-2.7)  \\
        $5k$ & 32.17 (30.83-33.5) & 27.5 (26.46-28.54) & 12.5 (7.41-17.59) & \textbf{40.92 (38.57-43.26)} & 96 (92.14-99.86) & 99 (97.04-100) & 23 (14.71-31.29) & \textbf{98 (95.24-100)} & \textbf{2.9 (2.8-3)} & 3.7 (3.5-3.8) & 1.2 (1-1.3) & 2.5 (2.4-2.6) \\
        $7.5k$ & 32.5 (31.33-33.67) & 27.63 (26.49-28.77) & 19.5 (15.05-23.95) & \textbf{40.5 (38.56-42.44)} & 97 (93.64-100) & 100 (100-100) & 46 (36.18-55.82) & \textbf{99 (97.04-100)} & \textbf{2.9 (2.9-3)} & 3.8 (3.6-3.9) & 1.5 (1.3-1.7) & 2.6 (2.4-2.7) \\
    \bottomrule[1pt]
    \end{tabular}
    \end{adjustbox}
    \caption{Average treatment effect (ATE) estimation with adjustment sets identified by LDP, PC, LDECC, and MB-by-MB for a 10-node linear-Gaussian DAG (Figure~\ref{fig:ten_node_dag}). Both the common cause criterion (CCC) and the disjunctive cause criterion (DCC) were considered. Values are reported for 100 replicate DAGs with 95\% confidence intervals in parentheses. Independence was determined by Fisher-z tests with $\alpha = 0.01$. Adjustment set quality was measured by the fraction of adjustment sets that are valid under the backdoor criterion, ATE (ground truth = 3.75), ATE mean squared error, confounder precision per adjustment set, confounder recall per adjustment set, and cardinality of the adjustment set (ground truth is 1 under the CCC and 3 under the DCC). The method proposed in this work is highlighted in yellow. The most performant values per metric are bolded. All experiments were run on a 2017 MacBook with a 2.9~GHz quad-core Intel Core i7 processor. Results are visualized in Figure~\ref{fig:baselines}.}
    \label{tab:ate}
\end{table}