%!TEX root = ../main.tex

% Two-row, full-width figure. Each row pairs a small F1-score table (left,
% 2in wide) with the corresponding plot (right, 4.5in wide):
%   top row    -- embedding comparison,
%   bottom row -- prompting comparison.
\begin{figure*}[t]
    \centering
    % ---- Top row: embeddings ----
    \begin{minipage}{2in}
        % \raggedleft instead of the flushright environment: the environment
        % is list-based and can add vertical space inside the minipage, which
        % shifts the table relative to the vertically centred plot beside it.
        \raggedleft
        \small
        \begin{tabular}{lr}
            \toprule
            \textbf{Embedding} & F1-score \\
            \midrule
            Raw pixel     & 19.3 \\
            RN-101        & 31.1 \\ % called ResNet-101 in the caption
            BiT-M         & 42.5 \\
            \textbf{CLIP} & \textbf{69.6} \\ % bold marks the best score
            \bottomrule
        \end{tabular}
    \end{minipage}
    \begin{minipage}{4.5in}
        \centering
        % \linewidth equals the minipage width here, so the plot fills the box.
        \includegraphics[width=\linewidth]{figs/video_lipschitzness_all.pdf}
    \end{minipage}
    \par % explicit row break: do not rely on TeX wrapping the line after 6.5in
    % ---- Bottom row: prompting ----
    \begin{minipage}{2in}
        \raggedleft
        \small
        \begin{tabular}{lr}
            \toprule
            \textbf{Prompting} & F1-score \\
            \midrule
            No Prompt              & 48.5 \\
            Prompt at Beginning    & 50.2 \\
            \textbf{Prompt at End} & \textbf{52.2} \\ % bold marks the best score
            \bottomrule
        \end{tabular}
    \end{minipage}
    \begin{minipage}{4.5in}
        \centering
        \includegraphics[width=\linewidth]{figs/text_lipschitzness_all.pdf}
    \end{minipage}
    % The trailing % signs keep the source line breaks from adding spurious
    % spaces at the start and end of the caption text.
    \caption{%
        Top: \sysname\ performance and smoothness measurements of CLIP, BiT-M, ResNet-101, and raw pixels as embeddings for \basketball.
        Bottom: \sysname\ performance and smoothness measurements of no prompting, prompting at beginning, and prompting at end in GPT-3 for \spouse.%
    }
    \label{smoothness_all}
\end{figure*}
