Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Rank,Relative Score (%)
gpt-5,87.0,6,87.0,57.5,50.0,None,1,58.0
gpt-oss-120b-high,75.0,6,75.0,50.38,50.0,None,2,50.0
gemini-2.5-pro,62.0,6,62.0,46.43,33.33,None,3,41.33
grok-4-fast-reasoning,61.0,6,61.0,43.38,33.33,None,4,40.67
gpt-oss-20b-high,55.0,6,55.0,36.14,33.33,None,4,36.67
gpt-oss-120b-medium,55.0,6,55.0,39.36,33.33,None,5,36.67
gemini-2.5-flash,53.0,6,53.0,38.26,33.33,None,6,35.33
gpt-oss-120b-low,51.0,6,51.0,34.57,33.33,None,7,34.0
gpt-oss-20b-low,50.0,6,50.0,33.52,33.33,None,8,33.33
gpt-oss-20b-medium,50.0,6,50.0,33.81,33.33,None,9,33.33
gpt-oss-120b_sp2,50.0,6,50.0,33.95,33.33,None,11,33.33
gpt-oss-120b_sp4,50.0,6,50.0,35.13,33.33,None,12,33.33
gpt-oss-120b_sp1,50.0,6,50.0,34.1,33.33,None,13,33.33
gpt-oss-120b_sp3,50.0,6,50.0,34.38,33.33,None,14,33.33
deepseek-reasoner,34.0,6,34.0,23.99,16.67,None,15,22.67
seed-oss_16384,50.0,6,50.0,36.93,33.33,None,10,33.33
gpt-o3-mini-high,50.0,6,50.0,36.07,33.33,None,11,33.33
seed-oss_-1,50.0,6,50.0,35.44,33.33,None,12,33.33
seed-oss_8192,42.0,6,42.0,26.06,16.67,None,13,28.0
claude-sonnet-4.5,39.0,6,39.0,30.28,16.67,None,20,26.0
seed-oss_4096,34.0,6,34.0,23.41,16.67,None,14,22.67
Qwen3-32B,25.0,6,25.0,19.4,16.67,None,25,16.67
gpt-4.1,33.0,6,33.0,23.48,16.67,None,16,22.0
seed-oss_512,33.0,6,33.0,21.62,16.67,None,17,22.0
deepseek-chat,26.0,6,26.0,18.95,16.67,None,18,17.33
Qwen3-14B,26.0,6,26.0,20.16,16.67,None,19,17.33
Qwen3-8B,25.0,6,25.0,16.67,16.67,None,20,16.67
seed-oss_2048,25.0,6,25.0,16.86,16.67,None,21,16.67
OlympicCoder-7B,25.0,6,25.0,16.86,16.67,None,29,16.67
OpenCodeReasoning-Nemotron-32B-IOI,25.0,6,25.0,17.43,16.67,None,30,16.67
DeepSeek-R1-Distill-Llama-70B,25.0,6,25.0,17.53,16.67,None,22,16.67
Qwen3-30B,25.0,6,25.0,18.1,16.67,None,24,16.67
seed-oss_1024,10.0,6,10.0,11.59,0.0,None,26,6.67
Llama-3.3-70B-Instruct,6.0,6,6.0,4.92,0.0,None,27,4.0
Qwen3-32B-Non-Thinking,5.0,6,5.0,4.06,0.0,None,28,3.33
Mistral-Large-Instruct-2411,5.0,6,5.0,4.15,0.0,None,29,3.33
Qwen2.5-Coder-7B-Instruct,5.0,6,5.0,4.3,0.0,None,30,3.33
Qwen2.5-72B,5.0,6,5.0,4.44,0.0,None,31,3.33
Qwen3-30B-Non-Thinking,5.0,6,5.0,4.54,0.0,None,33,3.33
Qwen2.5-Coder-14B-Instruct,5.0,6,5.0,4.25,0.0,None,35,3.33
DeepSeek-Coder-V2-Lite-Instruct,5.0,6,5.0,4.06,0.0,None,34,3.33
Qwen3-8B-Non-Thinking,5.0,6,5.0,4.44,0.0,None,36,3.33
Codestral-22B-v0.1,1.0,6,1.0,0.95,0.0,None,37,0.67
Qwen3-4B,1.0,6,1.0,9.54,0.0,None,38,0.67
QwQ-32B,25.0,6,25.0,17.81,16.67,None,23,16.67
DeepSeek-R1-Distill-Qwen-32B,5.0,6,5.0,4.06,0.0,None,32,3.33
DeepSeek-R1-Distill-Qwen-7B,0.0,6,0.0,0.0,0.0,None,39,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,6,0.0,0.0,0.0,None,40,0.0
DeepSeek-R1-Distill-Qwen-14B,0.0,6,0.0,6.05,0.0,None,42,0.0
Qwen2.5-Coder-32B-Instruct,0.0,6,0.0,2.07,0.0,None,45,0.0
Qwen3-14B-Non-Thinking,0.0,6,0.0,0.0,0.0,None,41,0.0
Llama-4-Scout,0.0,6,0.0,0.48,0.0,None,43,0.0
Llama-3.1-8B-Instruct,0.0,6,0.0,0.33,0.0,None,44,0.0
seed-oss_0,0.0,6,0.0,0.62,0.0,None,46,0.0
Qwen3-4B-Non-Thinking,0.0,6,0.0,0.28,0.0,None,47,0.0
Mistral-Small-3.1-24B-2503,0.0,6,0.0,2.47,0.0,None,48,0.0
