\begin{figure*}[th]
    \centering
    % First row of figures
    \begin{subfigure}{0.2\textwidth}
        \centering
        \includegraphics[width=\linewidth]{fig/mondrian/class_real.png}
        % \caption{Subcaption for image 1}
    \end{subfigure}
    % \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering
        \includegraphics[width=\linewidth]{fig/mondrian/class_dirac.png}
        % \caption{Subcaption for image 2}
    \end{subfigure}
        % \hfill
    \begin{subfigure}{0.251\textwidth}
        \centering
        \includegraphics[width=\linewidth]{fig/mondrian/entropy_std1_dis.png}
        % \caption{Subcaption for image 2}
    \end{subfigure}
    % \hfill
    \begin{subfigure}{0.205\textwidth}
        \centering
        \includegraphics[width=\linewidth]{fig/mondrian/color_stdrand_dis.png}
        % \caption{Subcaption for image 2}
    \end{subfigure}

    \vspace{-3mm}
    % \vspace{1em} % Add vertical space between rows

    \caption{True (\emph{top}) and recovered (\emph{bottom}) partition-conditional group distributions based on different data partitions (class, entropy, color) and shifts (outlined in \autoref{app:details-mcp}). \emph{From left to right:} (a) Class partition, no shift; (b) Class partition, \texttt{dirac} shift; (c) Entropy partition, \texttt{normal} shift; (d) Color partition, \texttt{var-gauss} shift. For (c) samples are partitioned by predictive entropy into exp. scaled bins, for (d) samples are assigned based on RGB values and average image color. Both are used as a measure of sample complexity. We consider $G$ as the $C8$ rotation group. Using the canonicalization network's group distributions and \autoref{eq:conditional_distribution}, the built group maps (\emph{bottom}) accurately uncover existing partition-conditional geometric patterns.
    }
    \label{fig:class_conditional_mondrian}
\end{figure*}


%------------------------------------------------


% \begin{figure*}[th]
%     \centering
%     % First row of figures
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint_real.png}
%         % \caption{Subcaption for image 1}
%     \end{subfigure}
%     \hfill
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint.png}
%         % \caption{Subcaption for image 2}
%     \end{subfigure}
%     \hfill
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint.png}
%         % \caption{Subcaption for image 3}
%     \end{subfigure}
    
%     \vspace{1em} % Add vertical space between rows

%     % Second row of figures
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint_real.png}
%         % \caption{Subcaption for image 4}
%     \end{subfigure}
%     \hfill
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint.png}
%         % \caption{Subcaption for image 5}
%     \end{subfigure}
%     \hfill
%     \begin{subfigure}{0.3\textwidth}
%         \centering
%         \includegraphics[width=\linewidth]{fig/SAMPLE_learned_joint.png}
%         % \caption{Subcaption for image 6}
%     \end{subfigure}
    
%     \caption{True (top) and recovered (bottom) group distributions. Left to right: assessing exchangeability, identifying feature-conditional partition, recovering class-conditional shift.}
%     \label{fig:six_images}
% \end{figure*}
