,win_rate,standard_error,mode,avg_length,n_wins,n_wins_base,n_draws,n_total,discrete_win_rate,length_controlled_winrate
gpt4_1106_preview,50.0,0.0,community,2049,0,0,805,805,50.0,50.0
claude-3-opus-20240229,27.45341614906832,1.5714493961428302,minimal,1388,220,583,2,805,27.45341614906832,43.25056335573304
gpt4_0314,15.217391304347828,1.259117090773072,verified,1371,120,680,5,805,15.217391304347828,29.779791079392187
mistral-large-2402,16.459627329192546,1.306288755306555,minimal,1362,132,672,1,805,16.459627329192546,28.18279361879813
gpt4_0613,8.136645962732919,0.9581691305772524,minimal,1140,64,738,3,805,8.136645962732919,20.456928802947065
gpt-3.5-turbo-1106,6.211180124223603,0.8420811207823524,minimal,796,48,753,4,805,6.211180124223603,16.7339348632326
