Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,450.0,5,450.0,100.0,100.0,Gold,1,100.0,1,90.0
gpt-oss-120b_sp4,410.0,5,410.0,94.89,80.0,Gold,14,96.29629629629629,2,82.0
gpt-oss-120b_sp1,370.0,5,370.0,86.56,80.0,Gold,17,95.44159544159544,3,74.0
gpt-oss-20b-medium,370.0,5,370.0,86.56,80.0,Gold,17,95.44159544159544,2,74.0
gpt-oss-120b-medium,370.0,5,370.0,86.56,80.0,Gold,17,95.44159544159544,3,74.0
gpt-oss-120b-high,340.0,5,340.0,80.0,80.0,Gold,21,94.3019943019943,4,68.0
gpt-oss-20b-high,340.0,5,340.0,80.0,80.0,Gold,21,94.3019943019943,5,68.0
gpt-o3-mini-high,340.0,5,340.0,80.0,80.0,Gold,21,94.3019943019943,6,68.0
grok-4-fast-reasoning,340.0,5,340.0,80.0,80.0,Gold,21,94.3019943019943,9,68.0
gemini-2.5-pro,340.0,5,340.0,83.83,80.0,Gold,21,94.3019943019943,7,68.0
seed-oss_-1,290.0,5,290.0,71.24,60.0,Gold,28,92.3076923076923,8,58.0
gpt-oss-120b_sp2,285.0,5,285.0,70.21,60.0,Gold,28,92.3076923076923,12,57.0
deepseek-reasoner,260.0,5,260.0,65.11,60.0,Silver,31,91.45299145299145,9,52.0
claude-sonnet-4.5,260.0,5,260.0,77.61,60.0,Silver,31,91.45299145299145,14,52.0
gpt-oss-120b_sp3,255.0,5,255.0,68.94,60.0,Silver,35,90.31339031339031,15,51.0
QwQ-32B,245.0,5,245.0,72.5,60.0,Silver,37,89.74358974358974,10,49.0
Qwen3-14B,245.0,5,245.0,72.5,60.0,Silver,37,89.74358974358974,11,49.0
Qwen3-32B,245.0,5,245.0,72.93,60.0,Silver,37,89.74358974358974,13,49.0
Qwen3-30B,245.0,5,245.0,72.93,60.0,Silver,37,89.74358974358974,14,49.0
gemini-2.5-flash,245.0,5,245.0,72.93,60.0,Silver,37,89.74358974358974,12,49.0
gpt-oss-20b-low,230.0,5,230.0,60.0,60.0,Silver,44,87.74928774928775,15,46.0
gpt-oss-120b-low,230.0,5,230.0,60.0,60.0,Silver,44,87.74928774928775,16,46.0
OpenCodeReasoning-Nemotron-32B-IOI,230.0,5,230.0,60.0,60.0,Silver,44,87.74928774928775,23,46.0
DeepSeek-R1-Distill-Qwen-32B,230.0,5,230.0,60.0,60.0,Silver,44,87.74928774928775,17,46.0
gpt-4.1,230.0,5,230.0,62.81,60.0,Silver,44,87.74928774928775,18,46.0
Qwen3-4B,230.0,5,230.0,69.38,60.0,Silver,44,87.74928774928775,19,46.0
Qwen3-8B,230.0,5,230.0,69.38,60.0,Silver,44,87.74928774928775,20,46.0
OlympicCoder-7B,198.0,5,198.0,64.5,40.0,Silver,72,79.77207977207978,28,39.6
deepseek-chat,180.0,5,180.0,52.86,40.0,Bronze,107,69.8005698005698,21,36.0
Qwen2.5-Coder-32B-Instruct,163.0,5,163.0,52.98,20.0,Bronze,109,69.23076923076923,22,32.6
seed-oss_8192,160.0,5,160.0,40.0,40.0,Bronze,111,68.66096866096866,23,32.0
Qwen3-32B-Non-Thinking,160.0,5,160.0,40.0,40.0,Bronze,111,68.66096866096866,24,32.0
DeepSeek-R1-Distill-Llama-70B,160.0,5,160.0,40.71,40.0,Bronze,111,68.66096866096866,25,32.0
Mistral-Small-3.1-24B-2503,128.0,5,128.0,42.71,20.0,Bronze,129,63.53276353276353,28,25.6
Mistral-Large-Instruct-2411,148.0,5,148.0,49.14,20.0,Bronze,114,67.80626780626781,26,29.6
Qwen2.5-Coder-14B-Instruct,143.0,5,143.0,50.84,20.0,Bronze,117,66.95156695156695,27,28.6
Qwen2.5-72B,107.0,5,107.0,33.61,0.0,None,188,46.72364672364672,29,21.4
Qwen3-30B-Non-Thinking,104.0,5,104.0,33.48,0.0,None,189,46.43874643874644,30,20.8
Llama-3.3-70B-Instruct,96.0,5,96.0,30.4,20.0,None,191,45.86894586894587,31,19.2
Llama-4-Scout,85.0,5,85.0,32.14,20.0,None,192,45.58404558404558,32,17.0
Qwen3-4B-Non-Thinking,85.0,5,85.0,32.94,20.0,None,192,45.58404558404558,33,17.0
Qwen3-14B-Non-Thinking,80.0,5,80.0,28.0,20.0,None,260,26.210826210826212,34,16.0
DeepSeek-R1-Distill-Qwen-14B,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,35,10.0
Qwen2.5-Coder-7B-Instruct,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,36,10.0
seed-oss_1024,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,37,10.0
seed-oss_512,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,38,10.0
seed-oss_2048,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,39,10.0
seed-oss_0,50.0,5,50.0,20.0,20.0,None,274,22.22222222222222,40,10.0
seed-oss_4096,50.0,5,50.0,20.71,20.0,None,274,22.22222222222222,41,10.0
Llama-3.1-8B-Instruct,39.0,5,39.0,16.0,0.0,None,335,4.843304843304844,42,7.8
Qwen3-8B-Non-Thinking,39.0,5,39.0,16.0,0.0,None,335,4.843304843304844,43,7.8
Codestral-22B-v0.1,39.0,5,39.0,16.8,0.0,None,335,4.843304843304844,44,7.8
DeepSeek-Coder-V2-Lite-Instruct,39.0,5,39.0,13.73,0.0,None,335,4.843304843304844,45,7.8
seed-oss_16384,0.0,5,0.0,0.0,0.0,None,347,1.4245014245014245,46,0.0
DeepSeek-R1-Distill-Qwen-7B,0.0,5,0.0,0.0,0.0,None,347,1.4245014245014245,47,0.0
DeepSeek-R1-Distill-Llama-8B,0.0,5,0.0,0.0,0.0,None,347,1.4245014245014245,48,0.0
