Model,Total Score,Included Tasks,Included Score,Avg Tests Passed,Pass Rate (%),Medal,Human Relative Rank,Human Percentile,Rank,Relative Score (%)
gpt-oss-120b_sp2,75.0,5,75.0,100.0,100.0,Gold,1,100.0,1,100.0
gpt-oss-120b-medium,75.0,5,75.0,100.0,100.0,Gold,1,100.0,3,100.0
gpt-oss-120b_sp4,75.0,5,75.0,100.0,100.0,Gold,1,100.0,3,100.0
gpt-oss-120b_sp1,75.0,5,75.0,100.0,100.0,Gold,1,100.0,4,100.0
gpt-oss-120b_sp3,75.0,5,75.0,100.0,100.0,Gold,1,100.0,5,100.0
grok-4-fast-reasoning,75.0,5,75.0,100.0,100.0,Gold,1,100.0,6,100.0
claude-sonnet-4.5,75.0,5,75.0,100.0,100.0,Gold,1,100.0,7,100.0
gpt-oss-20b-high,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,35,20.0
gpt-oss-120b-low,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,41,20.0
Qwen3-32B,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,45,20.0
gpt-5,75.0,5,75.0,100.0,100.0,Gold,1,100.0,1,100.0
gpt-o3-mini-high,75.0,5,75.0,100.0,100.0,Gold,1,100.0,5,100.0
gemini-2.5-flash,75.0,5,75.0,100.0,100.0,Gold,1,100.0,7,100.0
gpt-oss-120b-high,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,40,20.0
seed-oss_-1,60.0,5,60.0,80.0,80.0,Silver,14,99.78981406628941,25,80.0
gpt-oss-20b-low,75.0,5,75.0,100.0,100.0,Gold,1,100.0,2,100.0
gemini-2.5-pro,75.0,5,75.0,100.0,100.0,Gold,1,100.0,6,100.0
gpt-4.1,75.0,5,75.0,100.0,100.0,Gold,1,100.0,8,100.0
OpenCodeReasoning-Nemotron-32B-IOI,75.0,5,75.0,100.0,100.0,Gold,1,100.0,19,100.0
deepseek-reasoner,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,36,20.0
DeepSeek-R1-Distill-Llama-70B,75.0,5,75.0,100.0,100.0,Gold,1,100.0,12,100.0
Qwen3-30B,75.0,5,75.0,100.0,100.0,Gold,1,100.0,11,100.0
gpt-oss-20b-medium,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,39,20.0
QwQ-32B,75.0,5,75.0,100.0,100.0,Gold,1,100.0,9,100.0
DeepSeek-R1-Distill-Qwen-14B,75.0,5,75.0,100.0,100.0,Gold,1,100.0,10,100.0
Qwen3-8B,75.0,5,75.0,100.0,100.0,Gold,1,100.0,4,100.0
DeepSeek-R1-Distill-Qwen-32B,72.0,5,72.0,96.13,80.0,Gold,2,99.98383185125303,13,96.0
Qwen3-32B-Non-Thinking,66.0,5,66.0,88.39,80.0,Gold,8,99.88682295877122,15,88.0
Llama-4-Scout,66.0,5,66.0,88.39,80.0,Gold,8,99.88682295877122,14,88.0
Qwen2.5-Coder-14B-Instruct,66.0,5,66.0,88.39,80.0,Gold,8,99.88682295877122,18,88.0
Mistral-Large-Instruct-2411,66.0,5,66.0,88.39,80.0,Gold,8,99.88682295877122,19,88.0
Qwen2.5-Coder-32B-Instruct,66.0,5,66.0,88.39,80.0,Gold,8,99.88682295877122,17,88.0
OlympicCoder-7B,63.0,5,63.0,87.1,80.0,Gold,443,92.85367825383993,33,84.0
Qwen3-30B-Non-Thinking,63.0,5,63.0,87.1,80.0,Gold,11,99.83831851253032,22,84.0
Qwen3-14B,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,38,20.0
Qwen3-4B,63.0,5,63.0,87.1,80.0,Gold,11,99.83831851253032,20,84.0
Qwen2.5-72B,63.0,5,63.0,83.23,80.0,Gold,11,99.83831851253032,21,84.0
Mistral-Small-3.1-24B-2503,63.0,5,63.0,84.52,80.0,Gold,11,99.83831851253032,23,84.0
seed-oss_8192,60.0,5,60.0,100.0,100.0,Silver,14,99.78981406628941,24,80.0
Codestral-22B-v0.1,60.0,5,60.0,82.58,80.0,Silver,14,99.78981406628941,26,80.0
Qwen3-4B-Non-Thinking,60.0,5,60.0,81.94,80.0,Silver,14,99.78981406628941,27,80.0
deepseek-chat,66.0,5,66.0,92.26,80.0,Gold,8,99.88682295877122,16,88.0
Llama-3.1-8B-Instruct,51.0,5,51.0,64.44,60.0,Silver,23,99.64430072756669,28,68.0
seed-oss_512,48.0,5,48.0,79.03,75.0,Bronze,26,99.59579628132579,29,64.0
Llama-3.3-70B-Instruct,48.0,5,48.0,71.23,60.0,Bronze,26,99.59579628132579,30,64.0
Qwen3-8B-Non-Thinking,33.0,5,33.0,54.03,50.0,None,41,99.35327405012126,33,44.0
DeepSeek-R1-Distill-Llama-8B,0.0,5,0.0,0.0,0.0,None,74,98.8197251414713,46,0.0
Qwen2.5-Coder-7B-Instruct,36.0,5,36.0,52.44,40.0,None,38,99.40177849636217,31,48.0
DeepSeek-Coder-V2-Lite-Instruct,36.0,5,36.0,52.44,40.0,None,38,99.40177849636217,32,48.0
seed-oss_16384,30.0,5,30.0,100.0,100.0,None,44,99.30476960388036,34,40.0
seed-oss_0,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,37,20.0
seed-oss_4096,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,42,20.0
seed-oss_2048,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,43,20.0
seed-oss_1024,15.0,5,15.0,100.0,100.0,None,59,99.06224737267583,44,20.0
DeepSeek-R1-Distill-Qwen-7B,0.0,5,0.0,0.0,0.0,None,74,98.8197251414713,47,0.0
