Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-oss-120b-high,360.0,4,360.0,80.0,80.0,Gold,1,100.0,1,90.0
gemini-2.5-pro,360.0,4,360.0,80.0,80.0,Gold,1,100.0,2,90.0
gpt-5,349.0,4,349.0,74.68,60.0,Gold,1,100.0,3,87.25
grok-4-fast-reasoning,251.0,4,251.0,82.55,75.0,Gold,3,98.88888888888889,4,62.75
claude-sonnet-4.5,240.0,4,240.0,81.47,75.0,Gold,3,98.88888888888889,5,60.0
gpt-oss-120b_sp3,240.0,4,240.0,60.14,60.0,Gold,3,98.88888888888889,6,60.0
seed-oss_16384,240.0,4,240.0,62.59,60.0,Gold,3,98.88888888888889,4,60.0
gpt-oss-120b_sp1,240.0,4,240.0,62.59,60.0,Gold,3,98.88888888888889,8,60.0
gpt-oss-20b-high,240.0,4,240.0,60.14,60.0,Gold,3,98.88888888888889,5,60.0
gpt-oss-120b-medium,203.0,4,203.0,62.39,40.0,Gold,6,97.22222222222223,6,50.75
gpt-oss-120b_sp2,184.0,4,184.0,49.04,40.0,Gold,6,97.22222222222223,11,46.0
gpt-o3-mini-high,184.0,4,184.0,50.99,40.0,Gold,6,97.22222222222223,7,46.0
Qwen3-32B,184.0,4,184.0,48.4,40.0,Gold,6,97.22222222222223,9,46.0
seed-oss_-1,184.0,4,184.0,48.4,40.0,Gold,6,97.22222222222223,8,46.0
gemini-2.5-flash,164.0,4,164.0,52.71,40.0,Silver,31,83.33333333333333,10,41.0
seed-oss_8192,159.0,4,159.0,52.91,40.0,Silver,31,83.33333333333333,11,39.75
gpt-oss-120b_sp4,157.0,4,157.0,46.54,40.0,Silver,31,83.33333333333333,17,39.25
gpt-oss-20b-medium,157.0,4,157.0,43.37,40.0,Silver,31,83.33333333333333,12,39.25
Qwen3-8B,147.0,4,147.0,42.58,40.0,Silver,31,83.33333333333333,13,36.75
Qwen3-14B,147.0,4,147.0,42.58,40.0,Silver,31,83.33333333333333,14,36.75
gpt-4.1,147.0,4,147.0,42.72,40.0,Silver,31,83.33333333333333,15,36.75
QwQ-32B,147.0,4,147.0,42.58,40.0,Silver,31,83.33333333333333,16,36.75
Qwen3-30B,147.0,4,147.0,42.72,40.0,Silver,31,83.33333333333333,18,36.75
deepseek-reasoner,147.0,4,147.0,42.72,40.0,Silver,31,83.33333333333333,17,36.75
gpt-oss-120b-low,147.0,4,147.0,45.82,40.0,Silver,31,83.33333333333333,19,36.75
seed-oss_4096,120.0,4,120.0,40.0,40.0,Silver,44,76.11111111111111,20,30.0
gpt-oss-20b-low,120.0,4,120.0,40.0,40.0,Silver,44,76.11111111111111,21,30.0
seed-oss_2048,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,24,30.0
OlympicCoder-7B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,29,30.0
Llama-4-Scout,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,23,30.0
DeepSeek-R1-Distill-Qwen-14B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,25,30.0
Qwen2.5-Coder-32B-Instruct,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,26,30.0
Qwen3-4B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,22,30.0
DeepSeek-R1-Distill-Llama-70B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,31,30.0
DeepSeek-R1-Distill-Qwen-32B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,28,30.0
Qwen2.5-72B,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,29,30.0
Qwen2.5-Coder-14B-Instruct,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,32,30.0
deepseek-chat,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,27,30.0
Qwen3-32B-Non-Thinking,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,30,30.0
OpenCodeReasoning-Nemotron-32B-IOI,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,40,30.0
Llama-3.3-70B-Instruct,120.0,4,120.0,40.14,40.0,Silver,44,76.11111111111111,33,30.0
Qwen3-30B-Non-Thinking,102.0,4,102.0,32.79,20.0,None,116,36.111111111111114,34,25.5
Qwen3-8B-Non-Thinking,102.0,4,102.0,32.65,20.0,None,116,36.111111111111114,35,25.5
Mistral-Small-3.1-24B-2503,72.0,4,72.0,29.59,0.0,None,123,32.22222222222222,36,18.0
Qwen3-14B-Non-Thinking,70.0,4,70.0,20.0,20.0,None,123,32.22222222222222,37,17.5
seed-oss_1024,65.0,4,65.0,26.94,20.0,None,129,28.88888888888889,38,16.25
seed-oss_0,65.0,4,65.0,26.94,20.0,None,129,28.88888888888889,39,16.25
Codestral-22B-v0.1,50.0,4,50.0,21.6,20.0,None,138,23.88888888888889,40,12.5
Qwen2.5-Coder-7B-Instruct,50.0,4,50.0,21.6,20.0,None,138,23.88888888888889,41,12.5
Mistral-Large-Instruct-2411,50.0,4,50.0,32.94,20.0,None,138,23.88888888888889,42,12.5
seed-oss_512,47.0,4,47.0,19.45,0.0,None,165,8.88888888888889,43,11.75
DeepSeek-Coder-V2-Lite-Instruct,32.0,4,32.0,13.99,0.0,None,165,8.88888888888889,44,8.0
Qwen3-4B-Non-Thinking,13.0,4,13.0,11.48,0.0,None,167,7.777777777777778,45,3.25
Llama-3.1-8B-Instruct,13.0,4,13.0,7.44,0.0,None,167,7.777777777777778,46,3.25
DeepSeek-R1-Distill-Llama-8B,0.0,4,0.0,0.0,0.0,None,173,4.444444444444445,47,0.0
