% !TEX root = ../main.tex
\begin{figure}
  \centering
  % \begin{minipage}{0.6\linewidth}
  %   \includegraphics[height=4.8cm]{figures/detailed_descriptions/barplots.pdf}
  % \end{minipage} \hfill
  % \begin{minipage}{0.3\linewidth}
  %       \includegraphics[height=2.5cm]{figures/detailed_descriptions/clip_similarity_auroc_p1_n1.pdf}    
  %       \includegraphics[height=2.5cm]{figures/detailed_descriptions/clip_similarity_domino_auroc_n1.pdf}    
  % \end{minipage}  
  \includegraphics[width=1.\textwidth]{figures/detailed_descriptions/barplotss.pdf}
\caption{%
% \textbf{(Left):}
% Mean and standard deviation of the similarity scores
% for images in failure modes and their corresponding descriptions as well as 
% the AUROC between the similarity score of captions to images inside failure modes and some images outside of the failure mode.
% Our method improves over DOMINO on different datasets.
Mean and standard deviation of the similarity scores between images in failure modes and their respective descriptions, along with the AUROC of the similarity score for separating images inside a failure mode from images outside of it.
Both demonstrate that our method outperforms DOMINO in the descriptions it generates for detected failure modes across various datasets.
}
% \textbf{(Right): }
% Histogram of similarity scores on failure modes detected over the Living17 dataset.
% For each failure mode, we take the corresponding caption and obtain similarity of that caption to images inside the group as well as some randomly sampled images outside of the group.
% }
\label{fig:auroc}
\end{figure}
