,win_rate,standard_error,mode,n_draws,n_total,n_wins,n_wins_base,output_length,avg_length
gpt4,77.01863354037268,1.46803688292698,minimal,12,805,614,179,,1365
claude,75.83850931677019,1.4981004247868313,minimal,9,805,606,190,,1082
llama-2-70b-chat-hf,72.91925465838509,1.5622590981080728,minimal,4,805,585,216,,1790
vicuna-33b-v1.3,72.36024844720497,1.5710737760483915,verified,5,805,580,220,,1479
claude-2,71.98757763975155,1.5824915958976835,minimal,1,805,579,225,1069.0,1069
jina-chat,66.64596273291924,1.65695577964565,community,5,805,534,266,,676
vicuna-13b-v1.3,66.2111801242236,1.6657907370589309,verified,2,805,532,271,,1132
wizardlm-13b,66.14906832298136,1.6584088766540706,minimal,9,805,528,268,,985
vicuna-13b,63.22981366459627,1.698243477332765,minimal,2,805,508,295,,1037
guanaco-65b,62.60869565217392,1.7063755171155923,minimal,0,805,504,301,,1249
vicuna-7b-v1.3,62.54658385093168,1.7035470981976453,verified,3,805,502,300,,1110
nous-hermes-13b,60.86956521739131,1.7144465955143962,verified,6,805,487,312,,844
guanaco-33b,57.88819875776397,1.7412811662531051,verified,0,805,466,339,,1311
vicuna-7b,57.329192546583855,1.7409917994657298,verified,3,805,460,342,,1044
oasst-rlhf-llama-33b,57.329192546583855,1.7409917994657302,minimal,3,805,460,342,,1079
llama-2-13b-chat-hf,56.14906832298136,1.7499783078823692,minimal,0,805,452,353,,1513
guanaco-13b,53.36239103362392,1.7582560332920765,verified,3,803,427,373,,1774
llama-2-7b-chat-hf,51.98757763975155,1.7608738025727095,minimal,1,805,418,386,,1479
oasst-sft-llama-33b,51.24223602484472,1.748518981999294,verified,13,805,406,386,,748
text_davinci_003,50.0,0.0,minimal,805,805,0,0,,307
alpaca-farm-ppo-sim-gpt4-20k,48.19875776397515,1.7512254507446705,verified,10,805,383,412,,511
guanaco-7b,47.5776397515528,1.7590989434689512,verified,2,805,382,421,,1364
falcon-40b-instruct,46.70807453416149,1.7551420072945083,minimal,4,805,374,427,,662
alpaca-farm-ppo-human,46.45962732919255,1.750131850347461,minimal,8,805,370,427,,803
pythia-12b-mix-sft,43.22981366459627,1.7449120766669366,verified,2,805,347,456,,913
oasst-sft-pythia-12b,32.79503105590062,1.6369108459870174,verified,16,805,256,533,,726
alpaca-7b,32.298136645962735,1.630307861230374,minimal,16,805,252,537,,396
falcon-7b-instruct,29.565217391304348,1.6021542242903124,verified,6,805,235,564,,478
text_davinci_001,21.490683229813666,1.421716368655911,minimal,20,805,163,622,,296
