Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-oss-120b-high,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,37,0.0
gpt-oss-20b-high,283.0,5,283.0,62.5,60.0,Silver,9,89.1891891891892,1,56.6
gpt-oss-120b_sp2,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,3,54.0
grok-4-fast-reasoning,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,4,54.0
gemini-2.5-flash,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,3,54.0
gpt-5,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,2,54.0
gemini-2.5-pro,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,4,54.0
gpt-oss-120b_sp3,270.0,5,270.0,60.0,60.0,Silver,10,87.83783783783784,8,54.0
gpt-oss-120b_sp4,234.0,5,234.0,52.65,40.0,Silver,11,86.48648648648648,9,46.8
seed-oss_16384,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,6,37.2
seed-oss_8192,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,8,37.2
gpt-oss-120b-medium,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,7,37.2
seed-oss_-1,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,5,37.2
gpt-o3-mini-high,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,9,37.2
gpt-oss-120b_sp1,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,15,37.2
Qwen3-30B,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,10,37.2
Qwen3-14B,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,11,37.2
Qwen3-32B,186.0,5,186.0,44.49,40.0,Silver,15,81.08108108108108,12,37.2
Qwen3-8B,160.0,5,160.0,40.0,40.0,Silver,15,81.08108108108108,13,32.0
gpt-oss-20b-medium,160.0,5,160.0,40.41,40.0,Silver,15,81.08108108108108,14,32.0
OpenCodeReasoning-Nemotron-32B-IOI,160.0,5,160.0,42.04,40.0,Silver,15,81.08108108108108,21,32.0
claude-sonnet-4.5,160.0,5,160.0,40.41,40.0,Silver,15,81.08108108108108,22,32.0
gpt-oss-120b-low,76.0,5,76.0,24.49,20.0,Bronze,24,68.91891891891892,16,15.2
deepseek-reasoner,76.0,5,76.0,24.49,20.0,Bronze,24,68.91891891891892,17,15.2
gpt-4.1,50.0,5,50.0,20.41,20.0,Bronze,32,58.108108108108105,19,10.0
deepseek-chat,50.0,5,50.0,20.0,20.0,Bronze,32,58.108108108108105,20,10.0
gpt-oss-20b-low,38.0,5,38.0,9.49,0.0,None,57,24.324324324324323,21,7.6
seed-oss_2048,12.0,5,12.0,5.0,0.0,None,60,20.27027027027027,22,2.4
seed-oss_0,12.0,5,12.0,5.0,0.0,None,60,20.27027027027027,23,2.4
QwQ-32B,148.0,5,148.0,29.49,20.0,Silver,15,81.08108108108108,15,29.6
DeepSeek-R1-Distill-Qwen-14B,0.0,5,0.0,0.41,0.0,None,60,20.27027027027027,42,0.0
seed-oss_512,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,24,0.0
Qwen2.5-Coder-14B-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,28,0.0
Qwen3-14B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,29,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,27,0.0
seed-oss_4096,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,30,0.0
Llama-4-Scout,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,25,0.0
Mistral-Large-Instruct-2411,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,33,0.0
Codestral-22B-v0.1,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,26,0.0
Qwen3-4B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,31,0.0
Qwen2.5-Coder-7B-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,32,0.0
DeepSeek-R1-Distill-Llama-70B,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,34,0.0
Llama-3.3-70B-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,35,0.0
Mistral-Small-3.1-24B-2503,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,36,0.0
Llama-3.1-8B-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,40,0.0
seed-oss_1024,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,38,0.0
DeepSeek-R1-Distill-Qwen-7B,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,39,0.0
OlympicCoder-7B,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,48,0.0
Qwen3-30B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,41,0.0
Qwen2.5-Coder-32B-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,47,0.0
DeepSeek-R1-Distill-Qwen-32B,50.0,5,50.0,20.0,20.0,Bronze,32,58.108108108108105,18,10.0
Qwen2.5-72B,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,43,0.0
Qwen3-4B,0.0,5,0.0,0.41,0.0,None,60,20.27027027027027,44,0.0
Qwen3-8B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,45,0.0
Qwen3-32B-Non-Thinking,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,46,0.0
DeepSeek-Coder-V2-Lite-Instruct,0.0,5,0.0,0.0,0.0,None,60,20.27027027027027,48,0.0
