Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,149.0,3,149.0,64.13,33.33,Silver,17,90.69767441860465,1,49.67
gpt-oss-20b-high,100.0,3,100.0,50.0,50.0,Bronze,44,75.0,2,33.33
gpt-oss-120b_sp4,45.0,3,45.0,28.4,0.0,None,94,45.93023255813954,3,15.0
gpt-o3-mini-high,31.0,3,31.0,43.08,0.0,None,114,34.30232558139535,3,10.33
gemini-2.5-flash,29.0,3,29.0,29.62,0.0,None,117,32.55813953488372,4,9.67
gemini-2.5-pro,29.0,3,29.0,51.61,0.0,None,117,32.55813953488372,5,9.67
grok-4-fast-reasoning,21.0,3,21.0,25.9,0.0,None,128,26.162790697674417,7,7.0
Qwen3-32B,19.0,3,19.0,36.19,0.0,None,129,25.58139534883721,6,6.33
gpt-4.1,4.0,3,4.0,29.74,0.0,None,162,6.395348837209302,11,1.33
claude-sonnet-4.5,16.0,3,16.0,50.45,0.0,None,130,25.0,10,5.33
gpt-oss-120b_sp1,16.0,3,16.0,50.15,0.0,None,130,25.0,11,5.33
QwQ-32B,15.0,3,15.0,12.67,0.0,None,152,12.209302325581396,7,5.0
deepseek-reasoner,15.0,3,15.0,13.78,0.0,None,152,12.209302325581396,8,5.0
Qwen3-8B,15.0,3,15.0,12.67,0.0,None,152,12.209302325581396,9,5.0
Qwen3-30B,15.0,3,15.0,13.78,0.0,None,152,12.209302325581396,10,5.0
gpt-oss-120b_sp3,4.0,3,4.0,27.57,0.0,None,162,6.395348837209302,16,1.33
Qwen3-8B-Non-Thinking,0.0,3,0.0,0.0,0.0,None,173,0.0,12,0.0
Codestral-22B-v0.1,0.0,3,0.0,0.0,0.0,None,173,0.0,13,0.0
Qwen3-30B-Non-Thinking,0.0,3,0.0,0.0,0.0,None,173,0.0,14,0.0
DeepSeek-R1-Distill-Qwen-7B,0.0,3,0.0,0.0,0.0,None,173,0.0,15,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,3,0.0,0.0,0.0,None,173,0.0,16,0.0
Llama-3.1-8B-Instruct,0.0,3,0.0,0.0,0.0,None,173,0.0,17,0.0
seed-oss_2048,0.0,3,0.0,0.0,0.0,None,173,0.0,19,0.0
seed-oss_512,0.0,3,0.0,0.0,0.0,None,173,0.0,20,0.0
seed-oss_8192,0.0,3,0.0,0.0,0.0,None,173,0.0,21,0.0
OpenCodeReasoning-Nemotron-32B-IOI,0.0,3,0.0,0.0,0.0,None,173,0.0,26,0.0
seed-oss_1024,0.0,3,0.0,0.0,0.0,None,173,0.0,23,0.0
seed-oss_0,0.0,3,0.0,0.0,0.0,None,173,0.0,24,0.0
Llama-4-Scout,0.0,3,0.0,0.0,0.0,None,173,0.0,22,0.0
seed-oss_16384,0.0,3,0.0,10.56,0.0,None,173,0.0,31,0.0
seed-oss_4096,0.0,3,0.0,1.65,0.0,None,173,0.0,35,0.0
DeepSeek-R1-Distill-Qwen-14B,0.0,3,0.0,5.93,0.0,None,173,0.0,32,0.0
Mistral-Small-3.1-24B-2503,0.0,3,0.0,3.17,0.0,None,173,0.0,33,0.0
Mistral-Large-Instruct-2411,0.0,3,0.0,1.65,0.0,None,173,0.0,34,0.0
gpt-oss-120b-high,0.0,3,0.0,5.93,0.0,None,173,0.0,28,0.0
DeepSeek-R1-Distill-Llama-70B,0.0,3,0.0,5.93,0.0,None,173,0.0,36,0.0
Qwen2.5-Coder-7B-Instruct,0.0,3,0.0,3.17,0.0,None,173,0.0,37,0.0
gpt-oss-20b-medium,0.0,3,0.0,19.82,0.0,None,173,0.0,27,0.0
DeepSeek-R1-Distill-Qwen-32B,0.0,3,0.0,9.52,0.0,None,173,0.0,39,0.0
Qwen2.5-Coder-14B-Instruct,0.0,3,0.0,3.17,0.0,None,173,0.0,38,0.0
Qwen3-4B-Non-Thinking,0.0,3,0.0,3.17,0.0,None,173,0.0,40,0.0
Qwen3-4B,0.0,3,0.0,8.33,0.0,None,173,0.0,26,0.0
deepseek-chat,0.0,3,0.0,5.93,0.0,None,173,0.0,29,0.0
gpt-oss-20b-low,0.0,3,0.0,0.0,0.0,None,173,0.0,25,0.0
gpt-oss-120b-low,0.0,3,0.0,4.65,0.0,None,173,0.0,30,0.0
OlympicCoder-7B,0.0,3,0.0,3.17,0.0,None,173,0.0,46,0.0
Qwen2.5-Coder-32B-Instruct,0.0,3,0.0,3.17,0.0,None,173,0.0,42,0.0
Qwen3-14B,0.0,3,0.0,9.52,0.0,None,173,0.0,41,0.0
Qwen3-14B-Non-Thinking,0.0,3,0.0,3.17,0.0,None,173,0.0,43,0.0
gpt-oss-120b_sp2,0.0,3,0.0,18.11,0.0,None,173,0.0,50,0.0
gpt-oss-120b-medium,0.0,3,0.0,7.25,0.0,None,173,0.0,45,0.0
Llama-3.3-70B-Instruct,0.0,3,0.0,4.6,0.0,None,173,0.0,44,0.0
Qwen2.5-72B,0.0,3,0.0,5.93,0.0,None,173,0.0,47,0.0
seed-oss_-1,0.0,3,0.0,23.74,0.0,None,173,0.0,46,0.0
DeepSeek-Coder-V2-Lite-Instruct,0.0,3,0.0,5.93,0.0,None,173,0.0,48,0.0
Qwen3-32B-Non-Thinking,0.0,3,0.0,0.0,0.0,None,173,0.0,18,0.0
