%!TEX root = ../main.tex

% Full-width float with four side-by-side panels: an F1-score table followed
% by a plot, once for each of the two tasks named in the caption.
% The line break after each \end{minipage} is read by TeX as an ordinary
% inter-word space, which is what separates neighbouring panels.
\begin{figure*}[t!]
    \centering
    % Panel 1: F1-score per embedding.
    \begin{minipage}{1.15in}
        \scriptsize
        \begin{tabular}{lr}
            \toprule
            \textbf{Embedding} & F1-score \\
            \midrule
            Raw pixel          & 19.3  \\
            RN-101        & 31.1\\
            BiT-M          & 42.5  \\
            \textbf{CLIP}            & \textbf{69.6}  \\
            \bottomrule
        \end{tabular}
    \end{minipage}
    % Panel 2: plot accompanying the embedding table.
    \begin{minipage}{1.85in}
        \centering
        % \linewidth equals the minipage width here (1.85in), so the image
        % keeps filling the panel if the panel width is ever retuned.
        \includegraphics[width=\linewidth]{figs/video_lipschitzness.pdf}
    \end{minipage}
    % Panel 3: F1-score per prompting strategy, pushed to the right edge of
    % its box so that it sits next to its plot.
    \begin{minipage}{1.7in}
        % \raggedleft rather than the flushright environment: the environment
        % is list-based and leaves extra vertical space after its content,
        % which makes this box taller at the bottom and shifts the table
        % relative to the other vertically centred panels.
        \raggedleft
        \scriptsize
        \begin{tabular}{lr}
            \toprule
            \textbf{Prompting} & F1-score \\
            \midrule
            No Prompt          & 48.5  \\
            Prompt Beginning          & 50.2  \\
            \textbf{Prompt End}          & \textbf{52.2} \\
            \bottomrule
        \end{tabular}
    \end{minipage}
    % Panel 4: plot accompanying the prompting table. The image is narrower
    % than its box (1.85in in 1.95in) and centred within it.
    \begin{minipage}{1.95in}
        \centering
        \includegraphics[width=1.85in]{figs/text_lipschitzness.pdf}
    \end{minipage}
    \caption{
        Left: \sysname\ performance and smoothness measurements of CLIP, BiT-M, ResNet-101, and raw pixels as embeddings for \basketball.
        Right: \sysname\ performance and smoothness measurements of no prompting, prompting at beginning, and prompting at end in GPT-3 for \spouse.
    }
    % Label name kept as-is: it is referenced from outside this file.
    \label{smoothness}
\end{figure*}
