Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,423.0,6,423.0,73.22,66.67,Gold,2,98.91304347826087,1,70.5
gpt-oss-120b-high,400.0,6,400.0,67.49,66.67,Gold,3,97.82608695652173,2,66.67
grok-4-fast-reasoning,331.0,6,331.0,63.58,33.33,Gold,5,95.65217391304348,3,55.17
gpt-oss-120b_sp2,270.0,6,270.0,46.84,33.33,Silver,11,89.1304347826087,4,45.0
gpt-oss-20b-high,245.0,6,245.0,60.71,50.0,Silver,13,86.95652173913044,3,40.83
gpt-o3-mini-high,227.0,6,227.0,40.96,16.67,Silver,21,78.26086956521739,4,37.83
gpt-oss-120b-medium,220.0,6,220.0,41.59,33.33,Bronze,24,75.0,5,36.67
gemini-2.5-pro,203.0,6,203.0,44.19,16.67,Bronze,27,71.73913043478261,6,33.83
gpt-oss-120b_sp4,200.0,6,200.0,43.29,16.67,Bronze,28,70.65217391304348,9,33.33
gpt-oss-120b_sp1,197.0,6,197.0,36.64,16.67,Bronze,29,69.56521739130434,10,32.83
gpt-oss-120b_sp3,176.0,6,176.0,38.12,16.67,Bronze,35,63.04347826086956,11,29.33
gemini-2.5-flash,162.0,6,162.0,30.59,0.0,Bronze,40,57.608695652173914,7,27.0
gpt-oss-20b-medium,160.0,6,160.0,31.9,20.0,Bronze,40,57.608695652173914,8,26.67
seed-oss_-1,113.0,6,113.0,22.33,0.0,Bronze,60,35.869565217391305,10,18.83
deepseek-reasoner,107.0,6,107.0,22.75,0.0,Bronze,60,35.869565217391305,11,17.83
claude-sonnet-4.5,99.0,6,99.0,24.79,0.0,Bronze,64,31.52173913043478,16,16.5
gpt-oss-120b-low,95.0,6,95.0,16.59,0.0,Bronze,65,30.434782608695652,12,15.83
seed-oss_16384,92.0,6,92.0,19.21,0.0,Bronze,66,29.347826086956523,13,15.33
Qwen3-32B,87.0,6,87.0,22.57,0.0,Bronze,67,28.26086956521739,14,14.5
Qwen3-14B,79.0,6,79.0,14.88,0.0,None,72,22.82608695652174,15,13.17
Qwen3-4B,68.0,6,68.0,13.47,0.0,None,75,19.565217391304348,16,11.33
Qwen3-30B,68.0,6,68.0,16.21,0.0,None,75,19.565217391304348,17,11.33
OpenCodeReasoning-Nemotron-32B-IOI,65.0,6,65.0,12.31,0.0,None,75,19.565217391304348,23,10.83
gpt-oss-20b-low,60.0,6,60.0,12.33,0.0,None,78,16.304347826086957,18,10.0
Qwen3-8B,59.0,6,59.0,14.03,0.0,None,78,16.304347826086957,19,9.83
Llama-3.3-70B-Instruct,51.0,6,51.0,16.33,0.0,None,78,16.304347826086957,20,8.5
seed-oss_8192,45.0,6,45.0,6.38,0.0,None,79,15.217391304347826,22,7.5
deepseek-chat,43.0,6,43.0,11.29,0.0,None,79,15.217391304347826,23,7.17
Qwen3-32B-Non-Thinking,0.0,6,0.0,0.0,0.0,None,91,2.1739130434782608,36,0.0
QwQ-32B,118.0,6,118.0,23.96,0.0,Bronze,58,38.04347826086956,9,19.67
Llama-4-Scout,20.0,6,20.0,5.95,0.0,None,84,9.782608695652174,25,3.33
DeepSeek-R1-Distill-Llama-70B,16.0,6,16.0,6.22,0.0,None,86,7.608695652173913,27,2.67
gpt-4.1,14.0,6,14.0,9.71,0.0,None,86,7.608695652173913,28,2.33
Mistral-Small-3.1-24B-2503,5.0,6,5.0,2.74,0.0,None,86,7.608695652173913,30,0.83
Qwen2.5-72B,5.0,6,5.0,6.34,0.0,None,86,7.608695652173913,31,0.83
Qwen3-30B-Non-Thinking,5.0,6,5.0,5.74,0.0,None,86,7.608695652173913,34,0.83
Mistral-Large-Instruct-2411,5.0,6,5.0,4.38,0.0,None,86,7.608695652173913,32,0.83
Qwen3-14B-Non-Thinking,5.0,6,5.0,2.76,0.0,None,86,7.608695652173913,33,0.83
Qwen2.5-Coder-14B-Instruct,5.0,6,5.0,3.86,0.0,None,86,7.608695652173913,35,0.83
OlympicCoder-7B,5.0,6,5.0,5.5,0.0,None,86,7.608695652173913,40,0.83
DeepSeek-R1-Distill-Qwen-32B,50.0,6,50.0,11.01,0.0,None,78,16.304347826086957,21,8.33
Qwen2.5-Coder-32B-Instruct,25.0,6,25.0,7.24,0.0,None,82,11.956521739130435,24,4.17
DeepSeek-R1-Distill-Qwen-14B,16.0,6,16.0,5.91,0.0,None,86,7.608695652173913,26,2.67
DeepSeek-R1-Distill-Qwen-7B,0.0,6,0.0,0.0,0.0,None,91,2.1739130434782608,37,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,6,0.0,0.0,0.0,None,91,2.1739130434782608,38,0.0
seed-oss_2048,0.0,6,0.0,0.0,0.0,None,91,2.1739130434782608,39,0.0
seed-oss_4096,0.0,6,0.0,0.0,0.0,None,91,2.1739130434782608,40,0.0
seed-oss_0,0.0,6,0.0,0.27,0.0,None,91,2.1739130434782608,41,0.0
Llama-3.1-8B-Instruct,0.0,6,0.0,0.27,0.0,None,91,2.1739130434782608,42,0.0
Codestral-22B-v0.1,0.0,6,0.0,0.27,0.0,None,91,2.1739130434782608,44,0.0
seed-oss_512,0.0,6,0.0,1.59,0.0,None,91,2.1739130434782608,43,0.0
Qwen3-4B-Non-Thinking,5.0,6,5.0,2.49,0.0,None,86,7.608695652173913,29,0.83
Qwen2.5-Coder-7B-Instruct,0.0,6,0.0,0.55,0.0,None,91,2.1739130434782608,46,0.0
Qwen3-8B-Non-Thinking,0.0,6,0.0,0.4,0.0,None,91,2.1739130434782608,45,0.0
seed-oss_1024,0.0,6,0.0,1.13,0.0,None,91,2.1739130434782608,47,0.0
DeepSeek-Coder-V2-Lite-Instruct,0.0,6,0.0,0.77,0.0,None,91,2.1739130434782608,48,0.0
