\review{
% Six-panel figure laid out as three rows of two panels.
% Each panel is a minipage holding one plot plus its own sub-caption and label,
% so individual panels can be referenced (e.g. \ref{fig:other_dims:secret}).
%
% Layout notes:
%  * The `%` after the left-hand \end{minipage} suppresses the end-of-line
%    space so that \hfill is the only glue between the two panels.
%  * Each row is ended with a blank line (paragraph break) BEFORE \vspace, so
%    the vertical gap is inserted in vertical mode. Issuing \vspace while still
%    in the row's paragraph leaves a stray interword space at the end of that
%    row, which shifts its right-hand panel relative to the last row.
%  * Inside a minipage, \linewidth is the panel width, so plots fill the panel.
\begin{figure}[!t]
    \centering
    % --- Row 1: overall score | knowledge ---
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/overall.pdf}
        \subcaption{Overall Score}
        \label{fig:other_dims:overall_score}
    \end{minipage}%
    \hfill
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/knowledge.pdf}
        \subcaption{Knowledge}
        \label{fig:other_dims:knowledge}
    \end{minipage}

    \vspace{0.3cm}
    % --- Row 2: financial benefits | social rules ---
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/fin_benefits.pdf}
        \subcaption{Financial Benefits}
        \label{fig:other_dims:financial_benefits}
    \end{minipage}%
    \hfill
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/social_rules.pdf}
        \subcaption{Social Rules}
        \label{fig:other_dims:social_rules}
    \end{minipage}

    \vspace{0.3cm}
    % --- Row 3: secret | relationship ---
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/secret.pdf}
        \subcaption{Secret}
        \label{fig:other_dims:secret}
    \end{minipage}%
    \hfill
    \begin{minipage}{0.48\textwidth}
        \centering
        \includegraphics[width=\linewidth]{figures/other_dims/relationship.pdf}
        \subcaption{Relationship}
        \label{fig:other_dims:relationship}
    \end{minipage}

    % Main caption first, then the label, so the label picks up the figure number.
    \caption{Performance of language agents and humans on the overall score and five additional evaluation dimensions in \sotopiaeval. Each subfigure shows the performance trend across episodes. These scores show little variance across episodes.}
    \label{fig:other_dims_combined}
\end{figure}
}
