% Column type `a`: a centred (`c`) column whose cells are shaded with
% Dandelion!15 via \columncolor. Used for the first column of each
% method group in the tables below.
\newcolumntype{a}{%
  >{\columncolor{Dandelion!15}}%
  c%
}

\begin{table}[!h]
    \centering
    %%%%%%%%%%%%%%%%%%%%
    %% COMMON CAUSE
    %%%%%%%%%%%%%%%%%%%%
    % Upper panel: adjustment-set quality under the common cause and the
    % disjunctive cause criteria. Each metric spans a 4-column group
    % (LDP, PC, LDECC, MB-by-MB); column type `a` shades the first (LDP)
    % column of every group. adjustbox caps the width at \textwidth.
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l accc accc accc}
    \toprule[1pt]
        % --- Panel title -------------------------------------------------
        & \multicolumn{12}{c}{\Large \fontfamily{cmr}\textsc{\textbf{Common Cause Criterion}}} \\
        \cmidrule(lr){2-13}
        % --- Metric group headers ----------------------------------------
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Valid Adjustment Set}}}
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Precision}}}
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Recall}}} \\
        \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13}
        % --- Method headers (one set per metric group) -------------------
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}
            & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}
            & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
        % \midrule instead of \hline: keeps booktabs' spacing around the rule.
        \midrule
        % --- Data: one source line per metric group ----------------------
        $25k$ & \textbf{0.8} & 0.7 & 0.0 & 0.0
              & \textbf{80.00 (53.87-100)} & 35.00 (20.03-49.97) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0)
              & \textbf{80.00 (53.87-100)} & 35.00 (20.03-49.97) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) \\
        $50k$ & 0.7 & \textbf{1.0} & 0.0 & 0.0
              & \textbf{76.67 (50.81-100)} & 50.00 (50.00-50.00) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0)
              & \textbf{80.00 (53.87-100)} & 50.00 (50.00-50.00) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) \\
        $75k$ & \textbf{0.9} & 0.4 & 0.0 & 0.0
              & \textbf{90.00 (80.02-99.98)} & 20.00 (4.00-36.00) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0)
              & \textbf{100 (100-100)} & 20.00 (4.00-36.00) & 0.0 (0.0-0.0) & 0.0 (0.0-0.0) \\
    \midrule[1pt]
    %%%%%%%%%%%%%%%%%%%%
    %% DISJUNCTIVE CAUSE
    %%%%%%%%%%%%%%%%%%%%
        % --- Panel title -------------------------------------------------
        & \multicolumn{12}{c}{\Large  \fontfamily{cmr}\textsc{\textbf{Disjunctive Cause Criterion}}} \\
        \cmidrule(lr){2-13}
        % --- Metric group headers ----------------------------------------
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Valid Adjustment Set}}}
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Precision}}}
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Confounder Recall}}} \\
        \cmidrule(lr){2-5} \cmidrule(lr){6-9} \cmidrule(lr){10-13}
        % --- Method headers (one set per metric group) -------------------
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}
            & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}
            & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB} \\
        % \midrule instead of \hline: keeps booktabs' spacing around the rule.
        \midrule
        % --- Data: one source line per metric group ----------------------
        % NOTE(review): in the 25k row MB-by-MB ties PC at 0.9 for Valid
        % Adjustment Set but only PC is bolded -- confirm this is intended.
        $25k$ & 0.8 & \textbf{0.9} & 0.3 & 0.9
              & \textbf{38.00 (25.33-50.67)} & 22.50 (17.60-27.40) & 33.33 (8.03-58.64) & 34.17 (24.91-43.42)
              & \textbf{80.00 (53.87-100)} & 45.00 (35.20-54.80) & 25.00 (8.67-41.33) & 45.00 (35.20-54.80) \\
        $50k$ & 0.7 & \textbf{1.0} & 0.2 & 0.7
              & \textbf{36.33 (23.92-48.75)} & 26.67 (24.49-28.84) & 10.00 (0-23.07) & 23.33 (11.71-34.96)
              & \textbf{80.00 (53.87-100)} & 60.00 (46.93-73.07) & 10.00 (0-23.07) & 35.00 (20.03-49.97) \\
        $75k$ & 0.9 & \textbf{1.0} & 0.0 & 0.4
              & \textbf{45.00 (41.73-48.27)} & 25.83 (24.2-27.47) & 8.33 (0-19.03) & 29.05 (12.20-45.90)
              & \textbf{100 (100-100)} & 50.00 (50.00-50.00) & 12.50 (0-28.54) & 35.71 (17.64-53.79) \\
        % Heavy rule closes this panel; a second tabular follows in the same float.
        \midrule[1pt]
    \end{tabular}
    \end{adjustbox}
    %%%%%%%
    %%%%%%%
    %%%%%%%
    % Lower panel: number of independence tests and runtime, reported once
    % for both criteria. Two 4-column groups (LDP, PC, LDECC, MB-by-MB);
    % column type `a` shades the first (LDP) column of each group.
    % NOTE(review): there is no \toprule here; presumably the heavy rule that
    % ends the preceding tabular is meant to serve as the top rule -- confirm.
    \begin{adjustbox}{max width=\textwidth}
    \begin{tabular}{l accc accc}
        % --- Panel title -------------------------------------------------
        & \multicolumn{8}{c}{\Large \fontfamily{cmr}\textsc{\textbf{Both Criteria}}} \\
        \cmidrule(lr){2-9}
        % --- Metric group headers ----------------------------------------
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Independence Tests}}}
        & \multicolumn{4}{c}{\fontfamily{cmr}\textsc{\textbf{Runtime (seconds)}}} \\
        \cmidrule(lr){2-5} \cmidrule(lr){6-9}
        % --- Method headers (one set per metric group) -------------------
        $n$ & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}
            & \textsc{LDP} & \textsc{PC} & \textsc{LDECC} & \textsc{MB-by-MB}  \\
        % \midrule instead of \hline: keeps booktabs' spacing around the rule.
        \midrule
        % --- Data: one source line per metric group ----------------------
        $25k$ & \textbf{142.9 (141.5-144.3)} & 3021.9 (2975.2-3068.6) & 2784.1 (2118.4-3449.8) & 823.7 (610.1-1037.3)
              & \textbf{0.065 (0.061-0.069)} & 92.08 (90.351-93.81) & 99.485 (78.085-120.885) & 86.292 (51.39-121.193) \\
        $50k$ & \textbf{146.9 (145.2-148.6)} & 3841.9 (3761.2-3922.6) & 4405 (3734.8-5075.2) & 1146.6 (660.5-1632.7)
              & \textbf{0.109 (0.101-0.116)} & 243.973 (237.472-250.474) & 310.255 (262.338-358.172) & 263.322 (145.116-381.528) \\
        $75k$ & \textbf{148.6 (147.3-149.9)} & 4307.9 (4225.9-4389.9) & 4615.2 (4049.2-5181.3) & 1567.3 (881.9-2252.7)
              & \textbf{0.162 (0.145-0.178)} & 415.874 (398.714-433.035) & 473.107 (408.198-538.016) & 582.672 (306.342-859.001) \\
        \bottomrule[1pt]
    \end{tabular}
    \end{adjustbox}
    
    %%%%%%%%%%
    %%%%%%%%%%
    %%%%%%%%%%



    \caption{Baseline comparison on the \textsc{Mildew} benchmark from \texttt{bnlearn}~\citep{scutari_learning_2010}, with \textsc{mikro\_1} as exposure and \textsc{meldug\_2} as outcome.
    Independence was determined by chi-square independence tests with $\alpha = 0.005$. Both the common cause criterion and the disjunctive cause criterion were considered. Values are reported for 10 replicate DAGs with 95\% confidence intervals in parentheses. Sample size is denoted by $n$. Adjustment set quality was measured by the fraction of adjustment sets that are valid under the backdoor criterion, confounder precision per adjustment set, and confounder recall per adjustment set. The method proposed in this work is highlighted in yellow. The most performant values per metric are bolded. All experiments were run on a 2017 MacBook with 2.9~GHz Quad-Core Intel Core i7. Results are visualized in Figure~\ref{fig:baselines}.}
    \label{tab:mildew}
\end{table}