% Named colours in the rgb model (channel values in [0, 1]).
% NOTE(review): presumably referenced by the PGF plots \input in the figure
% below -- confirm before renaming or removing.
\definecolor{darkgreen}{rgb}{0,0.5,0}
\definecolor{darkorange}{rgb}{0.8,0.4,0}
% Full-width figure with two panels:
%   (a) fig:expA -- ROC AUC over the number of paired samples,
%   (b) fig:expB -- ROC AUC and execution time over the concrete graph size.
% Panel widths (0.33 + 0.66 of \textwidth) leave only 0.01\textwidth of slack,
% so line ends between the panels are commented out to avoid stray spaces.
\begin{figure*}
  \centering
  % Panel (a): a single plot scaled to the panel width. Inside a subfigure
  % (a minipage) \linewidth is the width of the subfigure itself.
  \begin{subfigure}[b]{0.33\textwidth}
    \centering
    \resizebox{\linewidth}{!}{%
      % Trailing % keeps the line end from adding a space inside the scaled box.
      \input{figures/exp1_concrete_roc_auc_small.pgf}%
    }
    \caption{%
      Performance over Paired Samples~$|\dset_J|$
    }\label{fig:expA}
  \end{subfigure}%
  \hfill
  % Panel (b): two plots side by side, each 0.49 of the panel width,
  % separated by the ordinary inter-word space from the line end.
  \begin{subfigure}[b]{0.66\textwidth}
    \centering
    \resizebox{0.49\linewidth}{!}{%
      \input{figures/exp3_concrete_roc_auc_small.pgf}%
    }
    \resizebox{0.49\linewidth}{!}{%
      \input{figures/exp3_time_small.pgf}%
    }
    \caption{%
      Performance
      and Execution Time (s)
      over Concrete Graph Size~$|\set{X}|$
    }\label{fig:expB}
  \end{subfigure}
  % Main caption. The ties (~) keep each symbol attached to the noun before it;
  % the sentence-ending period follows the math directly, with a normal space after.
  \caption{%
    We report the performance
    of Abs-LiNGAM
    for (a) an increasing number
    of paired samples~$|\dset_J|$
    and (b) an increasing number
    of concrete nodes~$|\set{X}|$.
    We plot a variant
    of Abs-LiNGAM
    where we bootstrap
    the abstract causal discovery step
    with five repetitions.
    We report the area under the ROC curve
    and the execution time
    over 30 runs
    on randomly generated
    Erd\H{o}s-R\'enyi abstract graphs
    with $b=5$ nodes
    and 8 edges.
    In the first experiment,
    we sample for each abstract graph
    a concrete model
    with random size $|\set{X}| \in [25, 50]$.
    In the second experiment,
    we also vary the number of paired samples
    to always be twice the number of concrete nodes.
  }\label{fig:experiments}
\end{figure*}
