
% median: 0.043558282208588955

\begin{tikzpicture}
\definecolor{bailtool}{RGB}{155, 89, 182}                  % Purple (warm undertones)
\definecolor{bailstring}{RGB}{231, 76, 60}                 % Bright Red
\definecolor{bailpromptcontinuefirst}{RGB}{230, 126, 34}   % Standard Orange
\definecolor{bailpromptbailfirst}{RGB}{243, 156, 18}       % Golden Orange
\definecolor{bailpromptunknown}{RGB}{149,165,166}          % Gray
\usetikzlibrary{patterns}
\pgfplotstableread{
Label toolBailPr toolBailPr_err strBailPr strBailPr_err promptBailFirstBailPr promptBailFirstBailPr_err promptBailFirstUnknownPr promptContinueFirstBailPr promptContinueFirstBailPr_err promptContinueFirstUnknownPr
gpt-4o 2.042944785276074 0.21744253074502556 0 0 0 0 0 0 0 0
{} 0 0 0.31901840490797545 0.08734951693036817 0 0 0 0 0 0
{} 0 0 0 0 52.466257668711656 0.7665707964824237 1.1411042944785277 0 0 0
{} 0 0 0 0 0 0 0 51.93251533742331 0.766931457026479 0.6196319018404908
claude-3-6-sonnet 17.03558282208589 0.5771316133293325 0 0 0 0 0 0 0 0
{} 0 0 13.271165644171779 0.5208436178494069 0 0 0 0 0 0
{} 0 0 0 0 20.80368098159509 0.6231034545421195 0.1411042944785276 0 0 0
{} 0 0 0 0 0 0 0 25.693251533742334 0.670734420735604 0.2638036809815951
zai-org/GLM-4-32B-0414 71.47239263803681 0.6931456501085884 0 0 0 0 0 0 0 0
{} 0 0 0.8404907975460122 0.14061231013937578 0 0 0 0 0 0
{} 0 0 0 0 0.147239263803681 0.06001837776621577 0.4969325153374233 0 0 0
{} 0 0 0 0 0 0 0 0.8895705521472393 0.14459595679767218 0.8282208588957056
google/gemma-2-2b-it 0 0 0 0 0 0 0 0 0 0
{} 0 0 2.079754601226994 0.2193459223425212 0 0 0 0 0 0
{} 0 0 0 0 52.52147239263804 0.7665284802084759 0.049079754601226995 0 0 0
{} 0 0 0 0 0 0 0 5.226993865030675 0.34181126460118577 0.049079754601226995
Qwen3-8B 7.629447852760736 0.40761928515809015 0 0 0 0 0 0 0 0
{} 0 0 1.6294478527607361 0.19467467276963632 0 0 0 0 0 0
{} 0 0 0 0 1.1533742331288344 0.1643029366267986 0.28957055214723926 0 0 0
{} 0 0 0 0 0 0 0 6.088343558282209 0.3671917425789903 0.18650306748466258
Qwen2.5-7B-Instruct 1.0085889570552147 0.15381315761172387 0 0 0 0 0 0 0 0
{} 0 0 0.498159509202454 0.1086990281744821 0 0 0 0 0 0
{} 0 0 0 0 4.355828220858895 0.3134955956776603 0.32147239263803684 0 0 0
{} 0 0 0 0 0 0 0 0.36073619631901843 0.09276854837797718 0.294478527607362
}\datatable


\begin{axis}[
  ybar stacked,
  width = \linewidth,
  bar width = 8pt,
  ymin=0, ymax=100,
  xtick=data,
  ylabel = {Average bail \% on BailBench},
  enlarge x limits = {abs = 20pt},
  xticklabels from table={\datatable}{Label},
  xticklabel style={xshift=12pt,rotate=90,align=center}, % ← rightwards shift
  xtick style={draw=none},
  enlarge y limits={value=0.05,upper},
  legend style={cells={anchor=east},legend pos=north east},
  reverse legend=false
]
    \addplot[fill=bailtool,
           error bars/.cd,
           y dir=both,
           y explicit,
          ]
    table[
        x expr=\coordindex,
        y=toolBailPr,
        y error plus=toolBailPr_err,
        y error minus=toolBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Tool}
    \addplot[fill=bailstring,
           error bars/.cd,
           y dir=both,
           y explicit,
          ]
    table[
        x expr=\coordindex,
        y=strBailPr,
        y error plus=strBailPr_err,
        y error minus=strBailPr_err
    ]{\datatable};
    \addlegendentry{Bail String}
    \addplot[fill=bailpromptbailfirst,
           error bars/.cd,
           y dir=both,
           y explicit
          ]
    table[
        x expr=\coordindex,
        y=promptBailFirstBailPr,
        y error plus=promptBailFirstBailPr_err,
        y error minus=promptBailFirstBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Prompt Bail-first}
    \addplot[fill=bailpromptunknown
          ]
    table[
        x expr=\coordindex,
        y=promptBailFirstUnknownPr,
        forget plot,
    ]{\datatable};
    \addplot[fill=bailpromptcontinuefirst,
           error bars/.cd,
           y dir=both,
           y explicit
          ]
    table[
        x expr=\coordindex,
        y=promptContinueFirstBailPr,
        y error plus=promptContinueFirstBailPr_err,
        y error minus=promptContinueFirstBailPr_err
    ]{\datatable};
    \addlegendentry{Bail Prompt Continue-first}
    \addplot[fill=bailpromptunknown
          ]
    table[
        x expr=\coordindex,
        y=promptContinueFirstUnknownPr,
        forget plot,
    ]{\datatable};
    \addplot[
      draw=none,                       % nothing visible
      fill=bailpromptunknown
    ] coordinates {(0,0)};             % single dummy point
    \addlegendentry{Refusal Classifier/Invalid Outputs}

\end{axis}
\end{tikzpicture}
