


% Pin pgfplots to the 1.17 compatibility level so that newer package releases
% do not silently change the layout defaults of the plots below.
\pgfplotsset{compat=1.17}


% Starred (page-wide) float holding three pgfplots scatter panels side by side.
% NOTE(review): in standard two-column LaTeX classes starred floats are only
% placed at the top of a page or on a float page, so the `h!` specifier is
% probably not honoured here -- confirm against the document class in use.
\begin{figure*}[h!]
    \centering
    \begin{minipage}{0.9\textwidth}
    % Scale everything up to the matching closing brace to a width of
    % \textwidth; the `!` height argument keeps the aspect ratio.
    \resizebox{\textwidth}{!}{
    \begin{tikzpicture}
    % Panel (a): scatter plot for the Wild-TI2I benchmark.
    % x axis: CLIP text-image similarity, y axis: DINO structure distance.
    %
    % Appearance shared by the plot elements of this panel. The definitions
    % are made inside the tikzpicture, so they stay local to it.
    \pgfplotsset{
        disc marker/.style={only marks, mark=*, mark size=2pt},
        square marker/.style={only marks, mark=square*, mark size=2pt},
        pair link/.style={dashed, color=gray}
    }
    \tikzset{method label/.style={anchor=west, font=\scriptsize}}
    \begin{axis}[
        at={(0,0)},
        anchor=north west,
        title={(a) Wild-TI2I},
        xlabel={\scriptsize Text-Image Similarity (CLIP cosine similarity)},
        ylabel={\scriptsize Structure Distance (DINO self-similarity)},
        xmin=0.24, xmax=0.33,
        ymin=0.03, ymax=0.11,
        width=5cm, height=5cm,
        scale only axis,
        grid=both,
        grid style={dotted, gray},
        xtick={0.25, 0.26, 0.27, 0.28, 0.29, 0.30, 0.31, 0.32},
        ytick={0.03, 0.04, 0.05, 0.06, 0.07, 0.08, 0.09, 0.10},
        scaled ticks=false,
        % Small tick labels printed in fixed-point notation with 2 decimals.
        tick label style={
            font=\scriptsize,
            /pgf/number format/fixed,
            /pgf/number format/precision=2
        }
    ]
        % --- Disc markers, one per method, each followed by its text label.
        % The VQGAN-CLIP label starts at x=0.29, left of its marker at
        % x=0.324 (presumably so the text stays inside the plot area).
        \addplot[disc marker, color=red] coordinates {(0.324, 0.095)};
        \node[method label] at (axis cs:0.29, 0.095) {VQGAN-CLIP};

        \addplot[disc marker, color=orange] coordinates {(0.281, 0.105)};
        \node[method label] at (axis cs:0.281, 0.105) {SDEdit (n=0.85)};

        \addplot[disc marker, color=orange] coordinates {(0.268, 0.084)};
        \node[method label] at (axis cs:0.268, 0.084) {SDEdit (n=0.75)};

        \addplot[disc marker, color=orange] coordinates {(0.245, 0.052)};
        \node[method label] at (axis cs:0.245, 0.052) {SDEdit (n=0.6)};

        \addplot[disc marker, color=brown] coordinates {(0.253, 0.04)};
        \node[method label] at (axis cs:0.253, 0.04) {DiffuseIT};

        \addplot[disc marker, color=purple] coordinates {(0.2825, 0.058)};
        \node[method label] at (axis cs:0.2825, 0.058) {PnP};

        \addplot[disc marker, color=green] coordinates {(0.2961, 0.0492)};
        \node[method label] at (axis cs:0.2961, 0.0492) {Ours [l=4,5]};

        \addplot[disc marker, color=green] coordinates {(0.3105, 0.0602)};
        \node[method label] at (axis cs:0.3105, 0.0602) {Ours [l=4]};

        % --- Square markers (group tagged "Generated" in the source), in the
        % same method order and colours as the discs above; they carry no
        % text labels of their own.
        \addplot[square marker, color=red] coordinates {(0.325, 0.1)};
        \addplot[square marker, color=orange] coordinates {(0.283, 0.09)};
        \addplot[square marker, color=orange] coordinates {(0.272, 0.067)};
        \addplot[square marker, color=orange] coordinates {(0.247, 0.043)};
        \addplot[square marker, color=brown] coordinates {(0.255, 0.033)};
        \addplot[square marker, color=purple] coordinates {(0.289, 0.048)};
        \addplot[square marker, color=green] coordinates {(0.3083, 0.065)};
        \addplot[square marker, color=green] coordinates {(0.3193, 0.0852)};

        % --- Dashed grey segments joining each disc to the square marker of
        % the same method.
        \addplot[pair link] coordinates {(0.324, 0.095) (0.325, 0.1)};
        \addplot[pair link] coordinates {(0.281, 0.105) (0.283, 0.09)};
        \addplot[pair link] coordinates {(0.268, 0.084) (0.272, 0.067)};
        \addplot[pair link] coordinates {(0.245, 0.052) (0.247, 0.043)};
        \addplot[pair link] coordinates {(0.253, 0.04) (0.255, 0.033)};
        \addplot[pair link] coordinates {(0.2825, 0.058) (0.289, 0.048)};
        \addplot[pair link] coordinates {(0.2961, 0.0492) (0.3083, 0.065)};
        \addplot[pair link] coordinates {(0.3105, 0.0602) (0.3193, 0.0852)};

        % "Better" tag in the lower-right region (large x, small y).
        \node[anchor=west, font=\small] at (axis cs:0.31, 0.0358) {\textbf{Better}};
    \end{axis}
    \end{tikzpicture}
    % Subfigure (b): scatter plot for the ImageNet-R-TI2I benchmark.
    \begin{tikzpicture}
    % x axis: CLIP text-image similarity, y axis: DINO structure distance.
    %
    % Appearance shared by the plot elements of this panel. The definitions
    % are made inside the tikzpicture, so they stay local to it.
    \pgfplotsset{
        disc marker/.style={only marks, mark=*, mark size=2pt}
    }
    \tikzset{method label/.style={anchor=west, font=\scriptsize}}
    \begin{axis}[
        at={(0,0)},
        anchor=north west,
        title={(b) ImageNet-R-TI2I},
        xlabel={\scriptsize Text-Image Similarity (CLIP cosine similarity)},
        ylabel={\scriptsize Structure Distance (DINO self-similarity)},
        xmin=0.22, xmax=0.325,
        ymin=0.03, ymax=0.1,
        width=5cm, height=5cm,
        scale only axis,
        grid=both,
        grid style={dotted, gray},
        xtick={0.22, 0.24, 0.26, 0.28, 0.30, 0.32},
        ytick={0.03, 0.04, 0.05, 0.06, 0.07, 0.08, 0.09, 0.10},
        scaled ticks=false,
        % Small tick labels printed in fixed-point notation with 2 decimals.
        tick label style={
            font=\scriptsize,
            /pgf/number format/fixed,
            /pgf/number format/precision=2
        }
    ]
        % One disc marker per method, each followed by its text label.
        % The VQGAN-CLIP label starts at x=0.2804, left of its marker at
        % x=0.3204 (presumably so the text stays inside the plot area).
        \addplot[disc marker, color=red] coordinates {(0.3204, 0.089)};
        \node[method label] at (axis cs:0.2804, 0.089) {VQGAN-CLIP};

        \addplot[disc marker, color=orange] coordinates {(0.272, 0.096)};
        \node[method label] at (axis cs:0.272, 0.096) {SDEdit (n=0.85)};

        \addplot[disc marker, color=orange] coordinates {(0.269, 0.073)};
        \node[method label] at (axis cs:0.269, 0.073) {SDEdit (n=0.75)};

        % This label is nudged to x=0.258, slightly right of its marker.
        \addplot[disc marker, color=orange] coordinates {(0.255, 0.048)};
        \node[method label] at (axis cs:0.258, 0.048) {SDEdit (n=0.6)};

        \addplot[disc marker, color=blue] coordinates {(0.225, 0.057)};
        \node[method label] at (axis cs:0.225, 0.057) {P2P};

        \addplot[disc marker, color=brown] coordinates {(0.245, 0.035)};
        \node[method label] at (axis cs:0.245, 0.035) {DiffuseIT};

        \addplot[disc marker, color=purple] coordinates {(0.2725, 0.052)};
        \node[method label] at (axis cs:0.2725, 0.052) {PnP};

        \addplot[disc marker, color=green] coordinates {(0.298, 0.06)};
        \node[method label] at (axis cs:0.298, 0.06) {Ours [l=4]};

        \addplot[disc marker, color=green] coordinates {(0.3055, 0.083)};
        \node[method label] at (axis cs:0.3055, 0.083) {Ours [l=4,5]};

        % "Better" tag in the lower-right region (large x, small y).
        \node[anchor=west, font=\small] at (axis cs:0.295, 0.0358) {\textbf{Better}};
    \end{axis}
    \end{tikzpicture}



    
       \begin{tikzpicture}
    % Subfigure (c): scatter plot for the Generated ImageNet-R-TI2I benchmark.
    % x axis: CLIP text-image similarity, y axis: DINO structure distance.
    %
    % Appearance shared by the plot elements of this panel. The definitions
    % are made inside the tikzpicture, so they stay local to it.
    \pgfplotsset{
        square marker/.style={only marks, mark=square*, mark size=2pt}
    }
    \tikzset{method label/.style={anchor=west, font=\scriptsize}}
    \begin{axis}[
        at={(0,0)},
        anchor=north west,
        title={(c) Generated ImageNet-R-TI2I},
        xlabel={\scriptsize Text-Image Similarity (CLIP cosine similarity)},
        ylabel={\scriptsize Structure Distance (DINO self-similarity)},
        xmin=0.245, xmax=0.32,
        ymin=0.025, ymax=0.1,
        width=5cm, height=5cm,
        scale only axis,
        grid=both,
        grid style={dotted, gray},
        xtick={0.25, 0.26, 0.27, 0.28, 0.29, 0.30, 0.31, 0.32},
        ytick={0.03, 0.04, 0.05, 0.06, 0.07, 0.08, 0.09, 0.10},
        scaled ticks=false,
        % Small tick labels printed in fixed-point notation with 2 decimals.
        tick label style={
            font=\scriptsize,
            /pgf/number format/fixed,
            /pgf/number format/precision=2
        }
    ]
        % One square marker per method, each followed by its text label.
        % The VQGAN-CLIP label starts at x=0.287, left of its marker at
        % x=0.315 (presumably so the text stays inside the plot area).
        \addplot[square marker, color=red] coordinates {(0.315, 0.082)};
        \node[method label] at (axis cs:0.287, 0.082) {VQGAN-CLIP};

        \addplot[square marker, color=orange] coordinates {(0.28, 0.09)};
        \node[method label] at (axis cs:0.28, 0.09) {SDEdit (n=0.85)};

        \addplot[square marker, color=orange] coordinates {(0.267, 0.065)};
        \node[method label] at (axis cs:0.267, 0.065) {SDEdit (n=0.75)};

        \addplot[square marker, color=orange] coordinates {(0.248, 0.038)};
        \node[method label] at (axis cs:0.248, 0.038) {SDEdit (n=0.6)};

        % This label sits at y=0.094, slightly below its marker at y=0.095.
        \addplot[square marker, color=blue] coordinates {(0.282, 0.095)};
        \node[method label] at (axis cs:0.282, 0.094) {P2P (t=500)};

        \addplot[square marker, color=blue] coordinates {(0.268, 0.087)};
        \node[method label] at (axis cs:0.268, 0.087) {P2P (t=1000)};

        \addplot[square marker, color=brown] coordinates {(0.255, 0.035)};
        \node[method label] at (axis cs:0.255, 0.035) {DiffuseIT};

        \addplot[square marker, color=purple] coordinates {(0.275, 0.042)};
        \node[method label] at (axis cs:0.275, 0.042) {PnP};

        \addplot[square marker, color=green] coordinates {(0.3037, 0.049)};
        \node[method label] at (axis cs:0.3037, 0.049) {Ours [l=4]};

        \addplot[square marker, color=green] coordinates {(0.2927, 0.032)};
        \node[method label] at (axis cs:0.2927, 0.032) {Ours [l=4,5]};

        % "Better" tag in the lower-right region (large x, small y).
        \node[anchor=west, font=\small] at (axis cs:0.295, 0.0358) {\textbf{Better}};
    \end{axis}
       \end{tikzpicture}
    }
    \end{minipage}
    \caption{Quantitative evaluation. We measure CLIP cosine similarity (higher is better) and DINO-ViT self-similarity distance (lower is better) to quantify the fidelity to text and preservation of structure, respectively. We report these metrics on three benchmarks: (a) Wild-TI2I, (b) ImageNet-R-TI2I, and (c) Generated ImageNet-R-TI2I~\cite{tumanyan_plug-and-play_2023}.}
    \label{fig:pnp_map}
\end{figure*}
