Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
grok-4-fast-reasoning,49.0,5,49.0,68.64,60.0,Gold,91,97.71978718013682,1,65.33
gpt-oss-120b-high,47.0,5,47.0,65.66,60.0,Gold,15,99.64530022802128,1,62.67
gpt-oss-120b-low,45.0,5,45.0,63.54,60.0,Gold,17,99.59462883202433,2,60.0
gpt-5,45.0,5,45.0,63.01,60.0,Gold,17,99.59462883202433,3,60.0
claude-sonnet-4.5,36.0,5,36.0,50.91,40.0,Gold,351,91.13250570053205,5,48.0
gpt-o3-mini-high,34.0,5,34.0,47.21,40.0,Silver,27,99.34127185203953,4,45.33
gemini-2.5-pro,34.0,5,34.0,48.85,40.0,Silver,27,99.34127185203953,5,45.33
gpt-oss-120b_sp4,32.0,5,32.0,44.82,40.0,Silver,773,80.44084114517355,8,42.67
gpt-oss-20b-medium,32.0,5,32.0,43.54,40.0,Silver,29,99.29060045604257,6,42.67
gpt-oss-120b_sp3,32.0,5,32.0,44.82,40.0,Silver,773,80.44084114517355,10,42.67
gpt-oss-120b_sp2,32.0,5,32.0,44.82,40.0,Silver,773,80.44084114517355,11,42.67
gemini-2.5-flash,32.0,5,32.0,47.26,40.0,Silver,29,99.29060045604257,7,42.67
gpt-oss-20b-low,15.0,5,15.0,100.0,100.0,None,46,98.85989359006841,40,20.0
gpt-oss-20b-high,32.0,5,32.0,47.21,40.0,Silver,29,99.29060045604257,8,42.67
Qwen2.5-Coder-14B-Instruct,30.0,5,30.0,50.66,50.0,Bronze,31,99.23992906004561,10,40.0
Qwen3-14B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,46,0.0
Qwen2.5-72B,30.0,5,30.0,54.48,50.0,Bronze,31,99.23992906004561,11,40.0
seed-oss_8192,30.0,5,30.0,42.48,40.0,Bronze,31,99.23992906004561,12,40.0
seed-oss_1024,30.0,5,30.0,40.88,40.0,Bronze,31,99.23992906004561,13,40.0
seed-oss_-1,30.0,5,30.0,53.1,50.0,Bronze,31,99.23992906004561,9,40.0
deepseek-reasoner,30.0,5,30.0,43.94,40.0,Bronze,31,99.23992906004561,14,40.0
Qwen3-32B,30.0,5,30.0,42.88,40.0,Bronze,31,99.23992906004561,15,40.0
DeepSeek-R1-Distill-Llama-8B,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,44,0.0
Qwen3-32B-Non-Thinking,30.0,5,30.0,40.93,40.0,Bronze,31,99.23992906004561,16,40.0
Qwen3-4B-Non-Thinking,30.0,5,30.0,40.35,40.0,Bronze,31,99.23992906004561,21,40.0
gpt-4.1,30.0,5,30.0,42.88,40.0,Bronze,31,99.23992906004561,18,40.0
OpenCodeReasoning-Nemotron-32B-IOI,30.0,5,30.0,43.94,40.0,Bronze,1800,54.42107930073473,27,40.0
OlympicCoder-7B,30.0,5,30.0,42.88,40.0,Bronze,1800,54.42107930073473,28,40.0
Mistral-Large-Instruct-2411,30.0,5,30.0,42.12,40.0,Bronze,31,99.23992906004561,26,40.0
Qwen3-14B,30.0,5,30.0,42.88,40.0,Bronze,31,99.23992906004561,22,40.0
deepseek-chat,30.0,5,30.0,42.48,40.0,Bronze,31,99.23992906004561,20,40.0
DeepSeek-R1-Distill-Llama-70B,30.0,5,30.0,42.83,40.0,Bronze,31,99.23992906004561,25,40.0
Codestral-22B-v0.1,30.0,5,30.0,40.4,40.0,Bronze,31,99.23992906004561,27,40.0
Qwen3-8B,30.0,5,30.0,41.11,40.0,Bronze,31,99.23992906004561,19,40.0
Qwen3-4B,30.0,5,30.0,43.23,40.0,Bronze,31,99.23992906004561,17,40.0
Qwen3-30B,30.0,5,30.0,44.12,40.0,Bronze,31,99.23992906004561,29,40.0
Qwen3-30B-Non-Thinking,30.0,5,30.0,40.53,40.0,Bronze,31,99.23992906004561,31,40.0
Llama-3.3-70B-Instruct,30.0,5,30.0,40.93,40.0,Bronze,31,99.23992906004561,33,40.0
Llama-4-Scout,30.0,5,30.0,40.93,40.0,Bronze,31,99.23992906004561,32,40.0
gpt-oss-120b_sp1,30.0,5,30.0,43.23,40.0,Bronze,1800,54.42107930073473,40,40.0
gpt-oss-120b-medium,30.0,5,30.0,44.12,40.0,Bronze,31,99.23992906004561,34,40.0
Mistral-Small-3.1-24B-2503,30.0,5,30.0,40.53,40.0,Bronze,31,99.23992906004561,35,40.0
seed-oss_0,25.0,5,25.0,35.33,20.0,None,36,99.11325057005321,36,33.33
Qwen2.5-Coder-7B-Instruct,20.0,5,20.0,26.84,20.0,None,41,98.98657208006081,37,26.67
DeepSeek-Coder-V2-Lite-Instruct,17.0,5,17.0,27.98,20.0,None,44,98.91056498606537,38,22.67
seed-oss_512,16.0,5,16.0,26.7,20.0,None,45,98.88522928806688,39,21.33
Llama-3.1-8B-Instruct,15.0,5,15.0,23.32,20.0,None,46,98.85989359006841,41,20.0
Qwen3-8B-Non-Thinking,15.0,5,15.0,20.93,20.0,None,46,98.85989359006841,42,20.0
seed-oss_16384,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,43,0.0
seed-oss_4096,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,45,0.0
DeepSeek-R1-Distill-Qwen-7B,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,47,0.0
seed-oss_2048,0.0,5,0.0,0.0,0.0,None,61,98.47985812009121,48,0.0
Qwen2.5-Coder-32B-Instruct,30.0,5,30.0,40.53,40.0,Bronze,31,99.23992906004561,24,40.0
QwQ-32B,30.0,5,30.0,41.46,40.0,Bronze,31,99.23992906004561,23,40.0
DeepSeek-R1-Distill-Qwen-14B,30.0,5,30.0,40.75,40.0,Bronze,31,99.23992906004561,28,40.0
DeepSeek-R1-Distill-Qwen-32B,30.0,5,30.0,43.23,40.0,Bronze,31,99.23992906004561,30,40.0
