\begin{figure}[tbp!]
    \centering
    \begin{subfigure}{0.6\textwidth}
        \centering
        \includegraphics[width=\textwidth]{figures/images/additional/llama2_fs_conformal.png}
        \caption{Llama 2 7B Chat}
        \label{fig:conformal_fs_llama}
    \end{subfigure}
    %
    \begin{subfigure}{0.6\textwidth}
        \centering
        \includegraphics[width=\textwidth]{figures/images/additional/mistral_fs_conformal.png}
        \caption{Mistral 7B Instruct}
        \label{fig:conformal_fs_mistral}
    \end{subfigure}
    \caption{For each target coverage, we run conformal methods (SC, CQR) and their multigroup counterparts (MVSC, GCCQR) on \textsc{Bio-FactScore}. We evaluate on generations by (a) Llama 2 7B Chat and (b) Mistral 7B Instruct. For each method, we calculate the coverage error averaged across all groups and plot the results side by side for each pairing of a method with its multigroup counterpart. All methods use \textit{self-consistency} as their base scoring function.}
    \label{fig:conformal_fs}
\end{figure}