Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-oss-120b_sp3,346.0,5,346.0,76.95,60.0,Silver,49,82.28782287822878,1,69.2
gpt-oss-120b_sp4,287.0,5,287.0,74.39,40.0,Bronze,82,70.11070110701107,2,57.4
gpt-o3-mini-high,284.0,5,284.0,76.14,40.0,Bronze,82,70.11070110701107,2,56.8
gpt-oss-120b-high,279.0,5,279.0,67.66,40.0,Bronze,87,68.26568265682657,3,55.8
claude-sonnet-4.5,275.0,5,275.0,76.29,40.0,Bronze,89,67.52767527675277,5,55.0
seed-oss_16384,256.0,5,256.0,67.93,40.0,Bronze,100,63.46863468634686,5,51.2
seed-oss_8192,256.0,5,256.0,68.44,40.0,Bronze,100,63.46863468634686,6,51.2
gemini-2.5-pro,256.0,5,256.0,67.92,40.0,Bronze,100,63.46863468634686,7,51.2
gemini-2.5-flash,256.0,5,256.0,67.48,40.0,Bronze,100,63.46863468634686,4,51.2
gpt-oss-120b_sp2,249.0,5,249.0,61.79,40.0,Bronze,102,62.730627306273064,10,49.8
gpt-oss-120b-medium,249.0,5,249.0,64.06,40.0,Bronze,102,62.730627306273064,8,49.8
gpt-oss-120b_sp1,249.0,5,249.0,61.61,40.0,Bronze,102,62.730627306273064,12,49.8
seed-oss_-1,246.0,5,246.0,59.58,40.0,Bronze,109,60.14760147601476,9,49.2
gpt-5,303.0,5,303.0,68.76,60.0,Bronze,74,73.06273062730628,1,60.6
gpt-oss-20b-high,200.0,5,200.0,51.85,50.0,None,158,42.06642066420664,10,40.0
gpt-oss-20b-medium,200.0,5,200.0,50.52,50.0,None,158,42.06642066420664,11,40.0
gpt-oss-120b-low,161.0,5,161.0,45.84,20.0,None,215,21.03321033210332,12,32.2
gpt-4.1,160.0,5,160.0,43.87,20.0,None,215,21.03321033210332,13,32.0
DeepSeek-R1-Distill-Llama-70B,128.0,5,128.0,40.59,20.0,None,224,17.71217712177122,14,25.6
Qwen3-32B,128.0,5,128.0,42.67,20.0,None,224,17.71217712177122,20,25.6
Qwen3-4B,110.0,5,110.0,28.23,20.0,None,230,15.498154981549815,15,22.0
Qwen3-8B,110.0,5,110.0,28.91,20.0,None,230,15.498154981549815,16,22.0
grok-4-fast-reasoning,103.0,5,103.0,46.69,33.33,None,232,14.760147601476016,23,20.6
OlympicCoder-7B,103.0,5,103.0,29.96,25.0,None,232,14.760147601476016,24,20.6
deepseek-reasoner,103.0,5,103.0,31.15,20.0,None,232,14.760147601476016,17,20.6
Qwen3-14B,103.0,5,103.0,27.59,20.0,None,232,14.760147601476016,26,20.6
OpenCodeReasoning-Nemotron-32B-IOI,100.0,5,100.0,40.72,33.33,None,232,14.760147601476016,27,20.0
seed-oss_2048,100.0,5,100.0,20.0,20.0,None,232,14.760147601476016,18,20.0
gpt-oss-20b-low,100.0,5,100.0,20.68,20.0,None,232,14.760147601476016,19,20.0
seed-oss_4096,100.0,5,100.0,20.48,20.0,None,232,14.760147601476016,20,20.0
Qwen3-4B-Non-Thinking,56.0,5,56.0,26.13,0.0,None,254,6.642066420664206,21,11.2
Llama-4-Scout,56.0,5,56.0,27.68,0.0,None,254,6.642066420664206,22,11.2
Qwen3-32B-Non-Thinking,56.0,5,56.0,26.13,0.0,None,254,6.642066420664206,23,11.2
Qwen3-30B-Non-Thinking,31.0,5,31.0,21.21,0.0,None,262,3.690036900369004,24,6.2
Mistral-Large-Instruct-2411,28.0,5,28.0,23.22,0.0,None,262,3.690036900369004,25,5.6
Qwen3-8B-Non-Thinking,28.0,5,28.0,22.02,0.0,None,262,3.690036900369004,26,5.6
Qwen2.5-Coder-7B-Instruct,15.0,5,15.0,10.86,0.0,None,271,0.36900369003690037,27,3.0
seed-oss_1024,0.0,5,0.0,0.23,0.0,None,272,0.0,29,0.0
seed-oss_512,0.0,5,0.0,0.0,0.0,None,272,0.0,30,0.0
seed-oss_0,0.0,5,0.0,1.32,0.0,None,272,0.0,31,0.0
Qwen3-14B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,272,0.0,28,0.0
