
% median: 0.002812208069497205

\begin{tikzpicture}
\definecolor{bailtool}{RGB}{155, 89, 182}                  % Purple (warm undertones)
\definecolor{bailstring}{RGB}{231, 76, 60}                 % Bright Red
\definecolor{bailpromptcontinuefirst}{RGB}{230, 126, 34}   % Standard Orange
\definecolor{bailpromptbailfirst}{RGB}{243, 156, 18}       % Golden Orange
\definecolor{bailpromptunknown}{RGB}{149,165,166}          % Gray
\usetikzlibrary{patterns}
\pgfplotstableread{
Label toolBailPr toolBailPr_err strBailPr strBailPr_err promptBailFirstBailPr promptBailFirstBailPr_err promptBailFirstUnknownPr promptContinueFirstBailPr promptContinueFirstBailPr_err promptContinueFirstUnknownPr
Hermes-3-Llama-3.2-3B 0.0 0.011781272457897283 0 0 0 0 0 0 0 0
{} 0 0 0.09600203060409329 0.04897087335826009 0 0 0 0 0 0
{} 0 0 0 0 35.70552147239264 0.7354788376174228 0 0 0 0
{} 0 0 0 0 0 0 0 10.128834355828223 0.4632232562817143 0
zai-org/GLM-4-32B-0414 6.502927279208952 0.3786375768077571 0 0 0 0 0 0 0 0
{} 0 0 0.3839382531107804 0.09564781275526596 0 0 0 0 0 0
{} 0 0 0 0 0.018404907975460127 0.023922434483238924 0 0 0 0
{} 0 0 0 0 0 0 0 0.06134969325153375 0.03978851642720141 0
Qwen3-8B 3.226965790224221 0.27148360275565236 0 0 0 0 0 0 0 0
{} 0 0 0.8991619599787004 0.1453612530986273 0 0 0 0 0 0
{} 0 0 0 0 0.2773006134969325 0.08156624723598353 0 0 0 0
{} 0 0 0 0 0 0 0 1.6613496932515337 0.19653246279099754 0
google/gemma-2-2b-it 0 0.011781272457897283 0 0 0 0 0 0 0 0
{} 0 0 0.8388315910522033 0.14047559298873827 0 0 0 0 0 0
{} 0 0 0 0 2.7239263803680984 0.2501168469820114 0 0 0 0
{} 0 0 0 0 0 0 0 0.1226993865030675 0.055006185371798216 0
claude-3-6-sonnet 1.95183327063717 0.21265154906361466 0 0 0 0 0 0 0 0
{} 0 0 0.6297266842000461 0.12198298595478296 0 0 0 0 0 0
{} 0 0 0 0 0.0 0.011781272457897283 0 0 0 0
{} 0 0 0 0 0 0 0 0.012269938650306749 0.020683466198947988 0
Qwen2.5-7B-Instruct 0.6472936454611414 0.12364622525153235 0 0 0 0 0 0 0 0
{} 0 0 0.2851410004025085 0.08268439889507184 0 0 0 0 0 0
{} 0 0 0 0 0.36809815950920244 0.0936918635589946 0 0 0 0
{} 0 0 0 0 0 0 0 0.09570552147239263 0.048899641761954646 0
gpt-4o 0.17061642462450535 0.0644294254647432 0 0 0 0 0 0 0 0
{} 0 0 0.1539087130876681 0.061309417706694944 0 0 0 0 0 0
{} 0 0 0 0 0.024539877300613498 0.026772042068470944 0 0 0 0
{} 0 0 0 0 0 0 0 0.09815950920245399 0.04948607345075612 0
}\datatable


\begin{axis}[
  ybar stacked,
  width = \linewidth,
  bar width = 8pt,
  ymin=0, ymax=100,
  xtick=data,
  ylabel = {Average no-refusal bail \% on BailBench},
  enlarge x limits = {abs = 20pt},
  xticklabels from table={\datatable}{Label},
  xticklabel style={xshift=12pt,rotate=90,align=center}, % ← rightwards shift
  xtick style={draw=none},
  enlarge y limits={value=0.05,upper},
  legend style={cells={anchor=east},legend pos=north east},
  reverse legend=false
]
    \addplot[fill=bailtool,
           error bars/.cd,
           y dir=both,
           y explicit,
          ]
    table[
        x expr=\coordindex,
        y=toolBailPr,
        y error plus=toolBailPr_err,
        y error minus=toolBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Tool}
    \addplot[fill=bailstring,
           error bars/.cd,
           y dir=both,
           y explicit,
          ]
    table[
        x expr=\coordindex,
        y=strBailPr,
        y error plus=strBailPr_err,
        y error minus=strBailPr_err
    ]{\datatable};
    \addlegendentry{Bail String}
    \addplot[fill=bailpromptbailfirst,
           error bars/.cd,
           y dir=both,
           y explicit
          ]
    table[
        x expr=\coordindex,
        y=promptBailFirstBailPr,
        y error plus=promptBailFirstBailPr_err,
        y error minus=promptBailFirstBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Prompt Bail-first}
    \addplot[fill=bailpromptunknown
          ]
    table[
        x expr=\coordindex,
        y=promptBailFirstUnknownPr,
        forget plot,
    ]{\datatable};
    \addplot[fill=bailpromptcontinuefirst,
           error bars/.cd,
           y dir=both,
           y explicit
          ]
    table[
        x expr=\coordindex,
        y=promptContinueFirstBailPr,
        y error plus=promptContinueFirstBailPr_err,
        y error minus=promptContinueFirstBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Prompt Continue-first}
    \addplot[fill=bailpromptunknown
          ]
    table[
        x expr=\coordindex,
        y=promptContinueFirstUnknownPr,
        forget plot,
    ]{\datatable};
    \addplot[
      draw=none,                       % nothing visible
      fill=bailpromptunknown
    ] coordinates {(0,0)};             % single dummy point
    \addlegendentry{Refusal Classifier/Invalid Outputs}

\end{axis}
\end{tikzpicture}
