% pearsonr bail str value: -0.013071360577408882 p value: 0.9433947333021078
% distance corr bail str value: 0.23000347823929304 p value: 0.59

\begin{figure}[H]
\centering
% Inline data table, stored in the macro \datatable for use by the plot below.
% One whitespace-separated row per model; the first row is the header:
%   Label    -- model identifier (text)
%   refusePr -- numeric value plotted on the x axis
%   bailPr   -- numeric value plotted on the y axis
% NOTE(review): both numeric columns contain values greater than 1, so they
% look like percentages rather than probabilities in [0,1] -- TODO confirm.
\pgfplotstableread{
Label refusePr bailPr
gpt-3.5-turbo 0.03680981595092025 83.77975178675092
gpt-4 0.09202453987730061 93.97783950638302
gpt-4-turbo 0.0 87.79797429423151
gpt-4o-mini 0.0 86.32249874150898
gpt-4o 0.31901840490797545 88.27282715478749
gpt-4.1-nano 0.0 91.87518332115332
gpt-4.1-mini 0.0 90.07945984469346
gpt-4.1 0.024539877300613498 92.55439197295846
claude-3-haiku-20240307 0.05644171779141104 97.52805055921178
claude-3-5-haiku-20241022 0.0 97.08691879433503
claude-3-5-sonnet-20240620 0.3067484662576687 97.56141413151617
claude-3-5-sonnet-20241022 13.271165644171779 97.30493857151818
claude-3-7-sonnet-20250219 5.079754601226994 93.72049780523525
claude-sonnet-4-20250514 0.3460122699386503 91.71525801318981
claude-3-opus-20240229 1.4184049079754601 97.65222037089703
claude-opus-4-20250514 0.18159509202453988 88.94525920002395
claude-opus-4-1-20250805 0.11042944785276074 90.29761679782575
NousResearch/Hermes-3-Llama-3.2-3B 0.18404907975460122 53.06528862214296
NousResearch/Hermes-3-Llama-3.1-8B 1.0858895705521474 69.03809739037938
unsloth/Llama-3.1-8B-Instruct 4.521472392638037 89.73584828052694
Qwen/Qwen3-1.7B 1.0 44.76861113689245
Qwen/Qwen3-4B 0.7423312883435583 57.59240693196745
Qwen/Qwen3-8B 1.6294478527607361 57.219730176900065
Qwen/Qwen3-32B 5.552147239263803 64.80506839774594
Qwen/Qwen3-30B-A3B 0.09815950920245399 66.6867686539797
Qwen/QwQ-32B 12.208588957055214 64.9813748272193
Qwen/Qwen2.5-7B-Instruct 0.498159509202454 80.1666466893057
zai-org/GLM-4-32B-0414 0.8404907975460122 86.36646310718476
zai-org/GLM-Z1-9B-0414 1.5276073619631902 62.884260388853974
google/gemma-2-2b-it 2.079754601226994 90.20442422800069
google/gemma-2-9b-it 6.159509202453988 95.48484590646319
google/gemma-2-27b-it 2.331288343558282 95.5098134642681
}\datatable
\begin{tikzpicture}
  % Scatter plot of the rows in \datatable: one mark per model, positioned at
  % (refusePr, bailPr) and annotated with the model name from the Label column.
  \begin{axis}[
      width=15cm,
      height=9cm,
      % NOTE(review): the plotted values exceed 1 (bailPr reaches ~97,
      % refusePr ~13), so they look like percentages although the axis labels
      % say "probability" -- confirm units and adjust the labels if needed.
      xlabel={Refusal probability (\texttt{refusePr})},
      ylabel={Bail-out probability (\texttt{bailPr})},
      title={LLM trade-off scatterplot},
      grid=both,
      enlargelimits=0.03,
      % nodes-near-coords settings: print each point's meta value next to it
      nodes near coords,
      point meta=explicit symbolic,      % meta is text (the model name), not a number
      every node near coord/.style={
        font=\scriptsize,
        anchor=west,             % place the label to the right of its mark
        xshift=2pt,
        draw=white, fill=white,  % tiny white halo for readability
        inner sep=1pt
      },
      % visual style of the marks
      only marks,
      mark=*,
      mark size=2pt,
      color=blue!60!black
  ]
    % The actual plot. Column names are case-sensitive and must match the
    % header row of \datatable exactly ("Label", not "label").
    \addplot table[
        x=refusePr,
        y=bailPr,
        meta=Label                % <-- use the "Label" column as point meta
    ] {\datatable};
  \end{axis}
\end{tikzpicture}
\end{figure}
