Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,762.0,8,762.0,87.87,77.78,Gold,15,98.80239520958084,1,95.25
seed-oss_16384,658.0,8,658.0,78.17,66.67,Gold,59,95.03849443969204,3,82.25
gpt-oss-120b-high,680.0,8,680.0,80.32,66.67,Gold,49,95.89392643284859,2,85.0
gpt-oss-120b-medium,657.0,8,657.0,78.85,66.67,Gold,59,95.03849443969204,4,82.12
gemini-2.5-pro,657.0,8,657.0,79.31,66.67,Gold,59,95.03849443969204,5,82.12
gpt-oss-120b_sp1,551.0,8,551.0,64.51,55.56,Silver,248,78.87082976903336,6,68.88
gpt-oss-120b_sp2,533.0,8,533.0,65.29,55.56,Silver,290,75.27801539777587,7,66.62
gpt-oss-20b-high,621.0,8,621.0,77.21,66.67,Silver,96,91.87339606501283,6,77.62
gpt-oss-120b_sp3,519.0,8,519.0,61.51,55.56,Bronze,330,71.8562874251497,9,64.88
gpt-o3-mini-high,569.0,8,569.0,74.66,44.44,Silver,200,82.97690333618478,8,71.12
seed-oss_-1,579.0,8,579.0,77.64,44.44,Silver,175,85.11548331907613,7,72.38
seed-oss_8192,471.0,8,471.0,67.99,33.33,Bronze,426,63.64414029084688,11,58.88
gemini-2.5-flash,538.0,8,538.0,76.8,33.33,Silver,271,76.90333618477331,10,67.25
Qwen3-32B,460.0,8,460.0,69.16,22.22,Bronze,433,63.045337895637296,12,57.5
grok-4-fast-reasoning,455.0,8,455.0,76.6,42.86,Bronze,437,62.703165098374676,15,56.88
gpt-oss-20b-medium,546.0,8,546.0,65.93,55.56,Silver,255,78.27202737382378,9,68.25
Qwen3-30B,397.0,8,397.0,67.57,22.22,Bronze,501,57.2284003421728,15,49.62
gpt-oss-120b-low,455.0,8,455.0,60.2,33.33,Bronze,437,62.703165098374676,13,56.88
Qwen3-14B,379.0,8,379.0,62.9,22.22,Bronze,508,56.629597946963216,17,47.38
gpt-oss-120b_sp4,369.0,8,369.0,50.01,33.33,Bronze,517,55.859709153122324,20,46.12
deepseek-reasoner,423.0,8,423.0,63.24,22.22,Bronze,469,59.96578272027374,14,52.88
claude-sonnet-4.5,348.0,8,348.0,65.12,25.0,Bronze,523,55.3464499572284,22,43.5
Qwen3-8B,397.0,8,397.0,66.62,22.22,Bronze,501,57.2284003421728,16,49.62
DeepSeek-R1-Distill-Qwen-32B,314.0,8,314.0,53.81,11.11,Bronze,542,53.72112917023097,19,39.25
QwQ-32B,313.0,8,313.0,54.62,22.22,Bronze,542,53.72112917023097,20,39.12
gpt-oss-20b-low,375.0,8,375.0,51.19,22.22,Bronze,512,56.287425149700596,18,46.88
seed-oss_4096,293.0,8,293.0,41.78,25.0,Bronze,559,52.26689478186484,22,36.62
OpenCodeReasoning-Nemotron-32B-IOI,253.0,8,253.0,42.65,22.22,Bronze,579,50.556030795551756,28,31.62
deepseek-chat,253.0,8,253.0,57.49,11.11,Bronze,579,50.556030795551756,24,31.62
Qwen3-4B,263.0,8,263.0,58.17,11.11,Bronze,574,50.98374679213003,23,32.88
DeepSeek-R1-Distill-Qwen-14B,240.0,8,240.0,33.22,22.22,None,588,49.786142001710864,25,30.0
DeepSeek-R1-Distill-Llama-70B,297.0,8,297.0,55.01,11.11,Bronze,559,52.26689478186484,21,37.12
Qwen2.5-Coder-32B-Instruct,220.0,8,220.0,38.67,11.11,None,594,49.272882805816934,26,27.5
gpt-4.1,200.0,8,200.0,42.22,11.11,None,641,45.25235243798118,27,25.0
Llama-3.3-70B-Instruct,190.0,8,190.0,36.29,11.11,None,644,44.99572284003422,28,23.75
Qwen3-32B-Non-Thinking,189.0,8,189.0,33.36,11.11,None,644,44.99572284003422,29,23.62
OlympicCoder-7B,185.0,8,185.0,32.27,11.11,None,644,44.99572284003422,37,23.12
Qwen3-30B-Non-Thinking,168.0,8,168.0,30.5,11.11,None,652,44.31137724550898,30,21.0
Qwen2.5-Coder-14B-Instruct,155.0,8,155.0,27.01,11.11,None,657,43.88366124893071,32,19.38
Qwen3-14B-Non-Thinking,165.0,8,165.0,28.83,11.11,None,652,44.31137724550898,31,20.62
Mistral-Small-3.1-24B-2503,135.0,8,135.0,30.51,11.11,None,669,42.857142857142854,33,16.88
seed-oss_0,130.0,8,130.0,18.24,11.11,None,682,41.74508126603935,34,16.25
Llama-4-Scout,117.0,8,117.0,17.52,11.11,None,705,39.7775876817793,35,14.62
Qwen2.5-72B,102.0,8,102.0,21.92,0.0,None,719,38.57998289136014,37,12.75
Codestral-22B-v0.1,100.0,8,100.0,12.41,11.11,None,785,32.93413173652694,38,12.5
DeepSeek-Coder-V2-Lite-Instruct,100.0,8,100.0,19.53,11.11,None,785,32.93413173652694,39,12.5
Qwen3-4B-Non-Thinking,112.0,8,112.0,26.28,0.0,None,705,39.7775876817793,36,14.0
Mistral-Large-Instruct-2411,60.0,8,60.0,25.5,0.0,None,830,29.0846877673225,40,7.5
seed-oss_1024,59.0,8,59.0,16.91,0.0,None,830,29.0846877673225,41,7.38
seed-oss_2048,51.0,8,51.0,21.92,0.0,None,848,27.54491017964072,42,6.38
seed-oss_512,40.0,8,40.0,18.36,0.0,None,858,26.689478186484173,43,5.0
DeepSeek-R1-Distill-Llama-8B,30.0,8,30.0,4.89,0.0,None,867,25.919589392643285,44,3.75
Qwen3-8B-Non-Thinking,14.0,8,14.0,12.65,0.0,None,914,21.899059024807528,45,1.75
Llama-3.1-8B-Instruct,0.0,8,0.0,0.0,0.0,None,963,17.70744225834046,46,0.0
Qwen2.5-Coder-7B-Instruct,0.0,8,0.0,2.0,0.0,None,963,17.70744225834046,47,0.0
