% pearsonr bail prompt bail first value: -0.1686031078511675 p value: 0.35629681003851993
% distance corr bail prompt bail first value: 0.2546164545837631 p value: 0.425

\begin{figure}[H]
\centering
% Inline data for the scatter plot, stored in the macro \datatable.
% One row per model, whitespace-separated columns:
%   Label    - model identifier (used as the text printed next to each point)
%   refusePr - refusal rate for that model
%   bailPr   - bail rate for that model
% NOTE(review): the values span roughly 0-100, so they appear to be percentages
% rather than probabilities in [0,1] -- confirm against the generating script.
% Column names are case-sensitive in pgfplotstable: refer to the first column
% as "Label" (capital L) when selecting it in a plot.
\pgfplotstableread{
Label refusePr bailPr
gpt-3.5-turbo 2.190184049079755 83.77975178675092
gpt-4 16.33128834355828 93.97783950638302
gpt-4-turbo 2.6319018404907975 87.79797429423151
gpt-4o-mini 15.030674846625766 86.32249874150898
gpt-4o 52.466257668711656 88.27282715478749
gpt-4.1-nano 12.460122699386503 91.87518332115332
gpt-4.1-mini 0.245398773006135 90.07945984469346
gpt-4.1 0.27607361963190186 92.55439197295846
claude-3-haiku-20240307 31.435582822085887 97.52805055921178
claude-3-5-haiku-20241022 10.521472392638037 97.08691879433503
claude-3-5-sonnet-20240620 1.687116564417178 97.56141413151617
claude-3-5-sonnet-20241022 20.80368098159509 97.30493857151818
claude-3-7-sonnet-20250219 0.4171779141104294 93.72049780523525
claude-sonnet-4-20250514 2.4171779141104297 91.71525801318981
claude-3-opus-20240229 12.94478527607362 97.65222037089703
claude-opus-4-20250514 8.49079754601227 88.94525920002395
claude-opus-4-1-20250805 13.447852760736195 90.29761679782575
NousResearch/Hermes-3-Llama-3.2-3B 65.14110429447852 53.06528862214296
NousResearch/Hermes-3-Llama-3.1-8B 0.22699386503067487 69.03809739037938
unsloth/Llama-3.1-8B-Instruct 33.23312883435583 89.73584828052694
Qwen/Qwen3-1.7B 38.47239263803681 44.76861113689245
Qwen/Qwen3-4B 1.3558282208588956 57.59240693196745
Qwen/Qwen3-8B 1.1533742331288344 57.219730176900065
Qwen/Qwen3-32B 3.9079754601226995 64.80506839774594
Qwen/Qwen3-30B-A3B 2.110429447852761 66.6867686539797
Qwen/QwQ-32B 5.319018404907975 64.9813748272193
Qwen/Qwen2.5-7B-Instruct 4.355828220858895 80.1666466893057
zai-org/GLM-4-32B-0414 0.147239263803681 86.36646310718476
zai-org/GLM-Z1-9B-0414 19.96319018404908 62.884260388853974
google/gemma-2-2b-it 52.52147239263804 90.20442422800069
google/gemma-2-9b-it 0.9693251533742332 95.48484590646319
google/gemma-2-27b-it 0.0 95.5098134642681
}\datatable
% Scatter plot: one mark per row of \datatable, x = refusePr, y = bailPr,
% with the model name printed next to each mark.
\begin{tikzpicture}
  \begin{axis}[
      width=15cm,
      height=9cm,
      % NOTE(review): the plotted values span roughly 0-100, i.e. they look
      % like percentages; consider stating the unit in the axis labels.
      xlabel={Refusal probability (\texttt{refusePr})},
      ylabel={Bail-out probability (\texttt{bailPr})},
      title={LLM trade-off scatterplot},
      grid=both,
      enlargelimits=0.03,
      % Print a text node next to every point.
      nodes near coords,
      % The point meta is given explicitly per row (via meta=... below) and is
      % treated as a symbol/string, not a number, so it is typeset verbatim.
      point meta=explicit symbolic,
      every node near coord/.style={
        font=\scriptsize,
        anchor=west,             % place the label to the right of the mark
        xshift=2pt,
        draw=white, fill=white,  % tiny white halo for readability
        inner sep=1pt
      },
      % Visual style of the marks (no connecting line).
      only marks,
      mark=*,
      mark size=2pt,
      color=blue!60!black
  ]
    % Column names are case-sensitive in pgfplotstable. The table header
    % declares the name column as "Label", so it must be selected with that
    % exact spelling; "label" would fail the column lookup.
    \addplot table[
        x=refusePr,
        y=bailPr,
        meta=Label
    ] {\datatable};
  \end{axis}
\end{tikzpicture}
\end{figure}
