Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,183.0,6,183.0,42.19,16.67,Bronze,143,59.887005649717516,1,30.5
gemini-2.5-pro,160.0,6,160.0,42.57,0.0,Bronze,173,51.41242937853107,2,26.67
gpt-oss-120b-high,128.0,6,128.0,31.98,16.67,None,218,38.70056497175141,3,21.33
claude-sonnet-4.5,131.0,6,131.0,43.27,0.0,None,215,39.548022598870055,4,21.83
seed-oss_-1,125.0,6,125.0,29.37,0.0,None,222,37.570621468926554,4,20.83
grok-4-fast-reasoning,119.0,6,119.0,35.27,0.0,None,227,36.15819209039548,6,19.83
gpt-o3-mini-high,112.0,6,112.0,29.63,0.0,None,237,33.333333333333336,6,18.67
claude-haiku-4.5,107.0,6,107.0,37.72,0.0,None,244,31.35593220338983,8,17.83
Qwen3-30B-Non-Thinking,69.0,6,69.0,21.66,0.0,None,283,20.338983050847457,9,11.5
gemini-2.5-flash,63.0,6,63.0,20.68,0.0,None,289,18.64406779661017,10,10.5
deepseek-chat,62.0,6,62.0,22.67,0.0,None,290,18.361581920903955,11,10.33
gpt-4.1,32.0,6,32.0,11.26,0.0,None,319,10.169491525423728,20,5.33
Mistral-Large-Instruct-2411,44.0,6,44.0,14.29,0.0,None,312,12.146892655367232,13,7.33
OpenCodeReasoning-Nemotron-32B-IOI,42.0,6,42.0,13.11,0.0,None,314,11.581920903954803,14,7.0
gpt-oss-120b_sp2,42.0,6,42.0,16.89,0.0,None,314,11.581920903954803,15,7.0
QwQ-32B,59.0,6,59.0,14.69,0.0,None,291,18.07909604519774,12,9.83
Qwen3-14B-Non-Thinking,39.0,6,39.0,12.39,0.0,None,317,10.734463276836157,17,6.5
gpt-oss-20b-high,41.0,6,41.0,16.78,0.0,None,316,11.016949152542374,16,6.83
OlympicCoder-32B,34.0,6,34.0,11.67,0.0,None,319,10.169491525423728,19,5.67
gpt-oss-120b_sp1,32.0,6,32.0,15.18,0.0,None,319,10.169491525423728,20,5.33
gpt-oss-20b-low,32.0,6,32.0,9.9,0.0,None,319,10.169491525423728,18,5.33
gpt-oss-120b-medium,32.0,6,32.0,14.59,0.0,None,319,10.169491525423728,22,5.33
gpt-oss-120b-low,32.0,6,32.0,13.36,0.0,None,319,10.169491525423728,21,5.33
gpt-oss-20b-medium,42.0,6,42.0,16.76,0.0,None,314,11.581920903954803,15,7.0
Qwen3-14B,23.0,6,23.0,12.72,0.0,None,330,7.062146892655368,23,3.83
gpt-oss-120b_sp3,22.0,6,22.0,10.67,0.0,None,330,7.062146892655368,26,3.67
Qwen3-32B-Non-Thinking,19.0,6,19.0,9.14,0.0,None,335,5.649717514124294,24,3.17
gpt-oss-120b_sp4,18.0,6,18.0,6.95,0.0,None,336,5.367231638418079,28,3.0
Qwen3-32B,87.0,6,87.0,27.01,0.0,None,264,25.706214689265536,8,14.5
Qwen3-8B,13.0,6,13.0,7.28,0.0,None,340,4.237288135593221,27,2.17
deepseek-reasoner,13.0,6,13.0,9.81,0.0,None,340,4.237288135593221,28,2.17
OlympicCoder-7B,13.0,6,13.0,4.6,0.0,None,340,4.237288135593221,32,2.17
DeepSeek-R1-Distill-Llama-70B,13.0,6,13.0,10.41,0.0,None,340,4.237288135593221,30,2.17
DeepSeek-R1-Distill-Qwen-14B,5.0,6,5.0,4.72,0.0,None,347,2.2598870056497176,33,0.83
DeepSeek-R1-Distill-Qwen-32B,13.0,6,13.0,8.42,0.0,None,340,4.237288135593221,29,2.17
Qwen3-4B,5.0,6,5.0,4.08,0.0,None,347,2.2598870056497176,37,0.83
Llama-4-Scout,5.0,6,5.0,5.35,0.0,None,347,2.2598870056497176,36,0.83
Qwen2.5-Coder-14B-Instruct,0.0,6,0.0,5.52,0.0,None,347,2.2598870056497176,48,0.0
Qwen2.5-Coder-32B-Instruct,44.0,6,44.0,15.83,0.0,None,312,12.146892655367232,14,7.33
Qwen2.5-Coder-7B-Instruct,0.0,6,0.0,0.15,0.0,None,347,2.2598870056497176,40,0.0
DeepSeek-R1-Distill-Qwen-7B,0.0,6,0.0,0.0,0.0,None,347,2.2598870056497176,39,0.0
Llama-3.1-8B-Instruct,0.0,6,0.0,1.7,0.0,None,347,2.2598870056497176,41,0.0
Codestral-22B-v0.1,0.0,6,0.0,0.66,0.0,None,347,2.2598870056497176,42,0.0
Qwen3-4B-Non-Thinking,0.0,6,0.0,0.55,0.0,None,347,2.2598870056497176,43,0.0
Qwen3-8B-Non-Thinking,0.0,6,0.0,0.65,0.0,None,347,2.2598870056497176,44,0.0
DeepSeek-Coder-V2-Lite-Instruct,0.0,6,0.0,3.04,0.0,None,347,2.2598870056497176,45,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,6,0.0,2.15,0.0,None,347,2.2598870056497176,46,0.0
Mistral-Small-3.1-24B-2503,0.0,6,0.0,1.76,0.0,None,347,2.2598870056497176,47,0.0
