Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-5,698.0,9,698.0,86.61,66.67,Gold,44,96.14003590664272,1,77.56
gpt-oss-120b-high,680.0,9,680.0,81.82,66.67,Gold,67,94.0754039497307,2,75.56
grok-4-fast-reasoning,677.0,9,677.0,86.06,44.44,Gold,69,93.89587073608618,3,75.22
gpt-oss-120b_sp2,646.0,9,646.0,77.08,66.67,Silver,99,91.20287253141831,4,71.78
gpt-oss-120b-low,616.0,9,616.0,71.04,66.67,Silver,132,88.24057450628366,3,68.44
gpt-oss-20b-medium,607.0,9,607.0,69.03,55.56,Silver,140,87.52244165170556,5,67.44
gpt-o3-mini-high,616.0,9,616.0,73.87,66.67,Silver,132,88.24057450628366,4,68.44
gpt-oss-120b_sp3,606.0,9,606.0,73.92,55.56,Silver,142,87.34290843806104,8,67.33
seed-oss_-1,593.0,9,593.0,71.5,55.56,Silver,175,84.38061041292639,6,65.89
gpt-oss-120b-medium,583.0,9,583.0,76.26,55.56,Silver,189,83.12387791741472,7,64.78
gemini-2.5-pro,583.0,9,583.0,78.27,44.44,Silver,189,83.12387791741472,8,64.78
gpt-oss-120b_sp4,575.0,9,575.0,73.46,55.56,Silver,198,82.31597845601436,12,63.89
gemini-2.5-flash,558.0,9,558.0,77.21,33.33,Silver,245,78.09694793536805,9,62.0
gpt-oss-120b_sp1,537.0,9,537.0,70.68,44.44,Bronze,297,73.42908438061042,14,59.67
seed-oss_16384,512.0,9,512.0,65.63,33.33,Bronze,373,66.6068222621185,10,56.89
gpt-oss-20b-low,484.0,9,484.0,60.31,44.44,Bronze,417,62.657091561938955,12,53.78
gpt-oss-20b-high,480.0,9,480.0,71.02,57.14,Bronze,422,62.208258527827645,13,53.33
deepseek-reasoner,472.0,9,472.0,64.41,33.33,Bronze,434,61.1310592459605,14,52.44
Qwen3-14B,461.0,9,461.0,59.69,44.44,Bronze,442,60.412926391382406,15,51.22
Qwen3-32B,456.0,9,456.0,60.0,33.33,Bronze,449,59.78456014362657,16,50.67
seed-oss_8192,453.0,9,453.0,56.06,33.33,Bronze,450,59.69479353680431,17,50.33
OpenCodeReasoning-Nemotron-32B-IOI,445.0,9,445.0,57.18,33.33,Bronze,453,59.42549371633752,22,49.44
Qwen3-30B,441.0,9,441.0,59.0,33.33,Bronze,459,58.88689407540395,18,49.0
claude-sonnet-4.5,410.0,9,410.0,62.22,33.33,Bronze,475,57.450628366247756,24,45.56
Qwen3-4B,408.0,9,408.0,54.28,33.33,Bronze,477,57.27109515260323,19,45.33
Qwen3-8B,408.0,9,408.0,53.8,33.33,Bronze,477,57.27109515260323,20,45.33
DeepSeek-R1-Distill-Llama-70B,377.0,9,377.0,56.51,22.22,Bronze,502,55.02692998204668,21,41.89
Qwen2.5-Coder-14B-Instruct,373.0,9,373.0,50.94,22.22,Bronze,507,54.57809694793537,22,41.44
Qwen3-8B-Non-Thinking,373.0,9,373.0,47.63,22.22,Bronze,507,54.57809694793537,23,41.44
gpt-4.1,338.0,9,338.0,48.81,11.11,Bronze,524,53.05206463195691,25,37.56
OlympicCoder-7B,306.0,9,306.0,42.86,22.22,Bronze,543,51.34649910233393,31,34.0
seed-oss_4096,306.0,9,306.0,42.46,22.22,Bronze,543,51.34649910233393,27,34.0
deepseek-chat,299.0,9,299.0,45.96,11.11,Bronze,556,50.179533213644525,28,33.22
seed-oss_1024,296.0,9,296.0,39.14,22.22,Bronze,556,50.179533213644525,29,32.89
Mistral-Large-Instruct-2411,289.0,9,289.0,40.5,11.11,None,558,50.0,30,32.11
Llama-3.3-70B-Instruct,284.0,9,284.0,40.02,22.22,None,559,49.91023339317774,31,31.56
Mistral-Small-3.1-24B-2503,273.0,9,273.0,37.69,11.11,None,565,49.371633752244165,32,30.33
Qwen2.5-72B,264.0,9,264.0,38.27,11.11,None,566,49.281867145421906,33,29.33
Qwen3-30B-Non-Thinking,264.0,9,264.0,35.79,11.11,None,566,49.281867145421906,34,29.33
seed-oss_0,263.0,9,263.0,40.06,11.11,None,567,49.19210053859964,36,29.22
Qwen3-32B-Non-Thinking,254.0,9,254.0,38.76,11.11,None,569,49.012567324955114,37,28.22
Qwen3-14B-Non-Thinking,228.0,9,228.0,36.48,22.22,None,581,47.93536804308797,38,25.33
seed-oss_2048,221.0,9,221.0,36.04,11.11,None,585,47.576301615798926,39,24.56
Llama-4-Scout,219.0,9,219.0,29.9,22.22,None,591,47.03770197486535,40,24.33
Qwen2.5-Coder-7B-Instruct,199.0,9,199.0,29.59,11.11,None,618,44.614003590664275,41,22.11
seed-oss_512,190.0,9,190.0,30.71,11.11,None,621,44.34470377019748,42,21.11
Llama-3.1-8B-Instruct,190.0,9,190.0,25.61,11.11,None,621,44.34470377019748,43,21.11
Qwen3-4B-Non-Thinking,180.0,9,180.0,25.74,11.11,None,625,43.98563734290844,44,20.0
Codestral-22B-v0.1,165.0,9,165.0,27.43,11.11,None,635,43.08797127468582,45,18.33
DeepSeek-Coder-V2-Lite-Instruct,112.0,9,112.0,23.57,0.0,None,675,39.497307001795335,46,12.44
DeepSeek-R1-Distill-Qwen-14B,333.0,9,333.0,45.6,33.33,Bronze,526,52.87253141831239,26,37.0
DeepSeek-R1-Distill-Qwen-32B,349.0,9,349.0,42.58,33.33,Bronze,519,53.50089766606822,24,38.78
DeepSeek-R1-Distill-Llama-8B,100.0,9,100.0,11.89,11.11,None,727,34.829443447037704,47,11.11
QwQ-32B,496.0,9,496.0,60.41,44.44,Bronze,400,64.18312387791741,11,55.11
Qwen2.5-Coder-32B-Instruct,264.0,9,264.0,42.4,11.11,None,566,49.281867145421906,35,29.33
DeepSeek-R1-Distill-Qwen-7B,0.0,9,0.0,0.0,0.0,None,953,14.542190305206462,48,0.0
