,solver,solver_id,problem,competition,split,judge,accuracy
0,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
1,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_1,allrussian,proofs,OPC R1 8B,1.0
2,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
3,o4-mini (high),openai/o4-mini--high,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
4,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
5,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
6,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
7,GPT-5 (high),openai/gpt-5,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
8,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,1.0
9,Grok 4,xai/grok-4,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
10,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
11,Grok 4,xai/grok-4,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
12,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
13,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
14,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
15,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
16,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
17,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
18,o4-mini (high),openai/o4-mini--high,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
19,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
20,GPT-5 (high),openai/gpt-5,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
21,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
22,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
23,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
24,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
25,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
26,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
27,GPT-5 (high),openai/gpt-5,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
28,o4-mini (high),openai/o4-mini--high,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
29,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_11,allrussian,proofs,OPC R1 8B,1.0
30,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
31,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
32,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
33,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
34,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
35,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
36,o4-mini (high),openai/o4-mini--high,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
37,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
38,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
39,Grok 4,xai/grok-4,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
40,GPT-5 (high),openai/gpt-5,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
41,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
42,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
43,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
44,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
45,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
46,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
47,GPT-5 (high),openai/gpt-5,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
48,Grok 4,xai/grok-4,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
49,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
50,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
51,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
52,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
53,o4-mini (high),openai/o4-mini--high,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
54,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
55,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_14,allrussian,proofs,OPC R1 8B,1.0
56,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
57,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
58,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,1.0
59,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
60,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
61,Grok 4,xai/grok-4,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
62,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
63,o4-mini (high),openai/o4-mini--high,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
64,GPT-5 (high),openai/gpt-5,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
65,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
66,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
67,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
68,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
69,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
70,Grok 4,xai/grok-4,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
71,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,1.0
72,o4-mini (high),openai/o4-mini--high,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
73,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
74,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
75,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
76,o4-mini (high),openai/o4-mini--high,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
77,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
78,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
79,Grok 4,xai/grok-4,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
80,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
81,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
82,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
83,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
84,GPT-5 (high),openai/gpt-5,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
85,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
86,Grok 4,xai/grok-4,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
87,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
88,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
89,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
90,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
91,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
92,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
93,GPT-5 (high),openai/gpt-5,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
94,o4-mini (high),openai/o4-mini--high,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
95,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
96,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
97,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
98,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
99,Grok 4,xai/grok-4,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
100,o4-mini (high),openai/o4-mini--high,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
101,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
102,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
103,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
104,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
105,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
106,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
107,GPT-5 (high),openai/gpt-5,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
108,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
109,GPT-5 (high),openai/gpt-5,allrussian_2025_4,allrussian,proofs,OPC R1 8B,1.0
110,o4-mini (high),openai/o4-mini--high,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
111,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
112,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
113,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
114,Grok 4,xai/grok-4,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
115,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
116,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
117,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
118,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
119,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
120,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
121,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
122,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
123,GPT-5 (high),openai/gpt-5,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
124,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
125,Grok 4,xai/grok-4,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
126,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
127,o4-mini (high),openai/o4-mini--high,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
128,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
129,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
130,GPT-5 (high),openai/gpt-5,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
131,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
132,o4-mini (high),openai/o4-mini--high,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
133,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
134,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
135,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
136,Grok 4,xai/grok-4,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
137,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
138,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
139,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
140,o4-mini (high),openai/o4-mini--high,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
141,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
142,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
143,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_7,allrussian,proofs,OPC R1 8B,1.0
144,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
145,GPT-5 (high),openai/gpt-5,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
146,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,1.0
147,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
148,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
149,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
150,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
151,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
152,o4-mini (high),openai/o4-mini--high,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
153,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
154,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
155,Grok 4,xai/grok-4,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
156,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,1.0
157,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
158,GPT-5 (high),openai/gpt-5,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
159,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
160,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
161,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
162,GPT-5 (high),openai/gpt-5,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
163,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
164,Grok 4,xai/grok-4,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
165,o4-mini (high),openai/o4-mini--high,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
166,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
167,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
168,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
169,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
170,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
171,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
172,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
173,GPT OSS 120B (high),openai/oss-120b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
174,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_1,bmo,proofs,OPC R1 8B,1.0
175,o4-mini (high),openai/o4-mini--high,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
176,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
177,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
178,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
179,Grok 4,xai/grok-4,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
180,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
181,GPT-5 (high),openai/gpt-5,bmo_2025_1,bmo,proofs,OPC R1 8B,1.0
182,Grok 4,xai/grok-4,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
183,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
184,GPT OSS 120B (high),openai/oss-120b,bmo_2025_2,bmo,proofs,OPC R1 8B,1.0
185,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
186,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
187,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
188,o4-mini (high),openai/o4-mini--high,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
189,GPT-5 (high),openai/gpt-5,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
190,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
191,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
192,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
193,GPT OSS 120B (high),openai/oss-120b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
194,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_3,bmo,proofs,OPC R1 8B,1.0
195,GPT-5 (high),openai/gpt-5,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
196,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
197,o4-mini (high),openai/o4-mini--high,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
198,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_3,bmo,proofs,OPC R1 8B,1.0
199,Grok 4,xai/grok-4,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
200,GPT-5-mini (high),openai/gpt-5-mini,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
201,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
202,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
204,o4-mini (high),openai/o4-mini--high,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
205,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_4,bmo,proofs,OPC R1 8B,1.0
206,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
207,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
208,GPT-5 (high),openai/gpt-5,bmo_2025_4,bmo,proofs,OPC R1 8B,1.0
209,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
210,Grok 4,xai/grok-4,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
211,GPT-5-mini (high),openai/gpt-5-mini,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
212,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
213,GPT OSS 120B (high),openai/oss-120b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
214,GPT-5 (high),openai/gpt-5,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
215,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
216,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
217,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
218,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
219,Grok 4,xai/grok-4,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
220,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
221,GPT-5-mini (high),openai/gpt-5-mini,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
222,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
223,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
224,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
225,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
226,Grok 4,xai/grok-4,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
227,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
228,GPT-5 (high),openai/gpt-5,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
229,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
230,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
231,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
232,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
233,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
234,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
235,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
236,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
237,GPT-5 (high),openai/gpt-5,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
238,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
239,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
240,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
241,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
242,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
243,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
244,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
245,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
246,Grok 4,xai/grok-4,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
247,GPT-5 (high),openai/gpt-5,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
248,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
249,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
250,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
251,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
252,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
253,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
254,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
255,Grok 4,xai/grok-4,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
256,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
257,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
258,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
259,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
260,GPT-5-mini (high),openai/gpt-5-mini,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,1.0
261,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
262,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
263,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
264,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
265,Grok 4,xai/grok-4,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
266,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
267,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
268,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
269,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
270,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
271,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
272,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
273,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
274,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
275,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
276,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
277,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
278,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
279,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
280,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
281,Grok 4,xai/grok-4,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
282,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
283,GPT-5 (high),openai/gpt-5,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
284,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
285,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
286,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
287,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
288,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
289,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
290,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
291,Grok 4,xai/grok-4,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
292,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
293,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
294,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
295,Grok 4,xai/grok-4,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
296,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
297,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
298,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
299,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
300,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
301,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
302,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
303,Grok 4,xai/grok-4,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
304,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,1.0
305,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
306,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
307,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
308,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
309,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
310,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
311,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
312,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
313,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
314,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
315,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
316,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
317,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
318,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
319,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
320,Grok 4,xai/grok-4,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
321,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
322,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
323,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
324,Grok 4,xai/grok-4,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
325,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,1.0
326,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
327,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
328,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,1.0
329,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
330,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
331,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
332,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
333,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
334,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
335,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
336,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
337,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
338,Grok 4,xai/grok-4,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
339,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
340,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
341,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
342,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
343,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
344,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
345,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
346,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
347,Grok 4,xai/grok-4,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
348,GPT-5 (high),openai/gpt-5,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
349,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
350,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
351,Grok 4,xai/grok-4,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
352,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
353,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
354,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
355,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
356,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
357,GPT-5 (high),openai/gpt-5,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
358,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
359,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
360,GPT-5 (high),openai/gpt-5,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,1.0
361,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
362,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
363,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
364,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
365,GPT-5-mini (high),openai/gpt-5-mini,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
366,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
367,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
368,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
369,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
370,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
371,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
372,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
373,Grok 4,xai/grok-4,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
374,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
375,GPT-5-mini (high),openai/gpt-5-mini,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
376,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
377,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
378,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
379,GPT-5 (high),openai/gpt-5,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
380,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
381,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
382,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
383,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
384,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
385,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
386,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
387,Grok 4,xai/grok-4,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
388,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
389,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,1.0
390,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
391,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
392,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
393,Grok 4,xai/grok-4,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
394,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,1.0
395,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
396,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
397,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
398,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
399,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
400,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
401,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,1.0
402,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
403,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
404,Grok 4,xai/grok-4,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
405,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
406,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
407,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
408,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
409,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
410,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
411,Grok 4,xai/grok-4,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
412,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
413,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
414,GPT-5 (high),openai/gpt-5,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
415,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
416,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
417,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
418,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,1.0
419,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
420,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
421,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
422,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
423,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
424,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
425,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
426,Grok 4,xai/grok-4,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
427,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
428,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
429,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
430,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
431,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,1.0
432,Grok 4,xai/grok-4,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
433,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
434,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,1.0
435,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
436,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
437,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
438,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,1.0
439,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,1.0
440,Grok 4,xai/grok-4,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
441,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
442,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
443,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
444,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
445,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
446,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
447,GPT-5 (high),openai/gpt-5,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
448,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
449,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
450,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
451,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
452,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
453,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
454,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
455,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
456,Grok 4,xai/grok-4,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
457,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
458,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
459,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
460,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
461,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
462,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
463,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
464,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
465,Grok 4,xai/grok-4,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
466,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
467,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
468,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
469,o4-mini (high),openai/o4-mini--high,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
470,Grok 4,xai/grok-4,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
471,GPT-5 (high),openai/gpt-5,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
472,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
473,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
474,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
475,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
476,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
477,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
478,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
479,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
480,GPT-5 (high),openai/gpt-5,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
481,Grok 4,xai/grok-4,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
482,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
483,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
484,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
485,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
486,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
487,o4-mini (high),openai/o4-mini--high,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
488,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,1.0
489,GPT-5 (high),openai/gpt-5,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
490,o4-mini (high),openai/o4-mini--high,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
491,Grok 4,xai/grok-4,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
492,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
493,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
494,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
495,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
496,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
497,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
498,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
499,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
500,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
501,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
502,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
503,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
504,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
505,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
506,o4-mini (high),openai/o4-mini--high,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
507,GPT-5 (high),openai/gpt-5,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
508,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
509,Grok 4,xai/grok-4,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
510,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
511,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,1.0
512,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
513,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
514,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
515,o4-mini (high),openai/o4-mini--high,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
516,GPT-5 (high),openai/gpt-5,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
517,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
518,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
519,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
520,Grok 4,xai/grok-4,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
521,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
522,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
523,Grok 4,xai/grok-4,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
524,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
525,GPT-5 (high),openai/gpt-5,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
526,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
527,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
528,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
529,o4-mini (high),openai/o4-mini--high,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
530,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
531,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
532,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_1,canada,proofs,OPC R1 8B,0.0
533,GPT-5 (high),openai/gpt-5,canada_2025_1,canada,proofs,OPC R1 8B,0.0
534,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_1,canada,proofs,OPC R1 8B,0.0
535,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
536,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
537,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_1,canada,proofs,OPC R1 8B,0.0
538,o4-mini (high),openai/o4-mini--high,canada_2025_1,canada,proofs,OPC R1 8B,0.0
539,GPT OSS 120B (high),openai/oss-120b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
540,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
541,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_2,canada,proofs,OPC R1 8B,1.0
542,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_2,canada,proofs,OPC R1 8B,1.0
543,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_2,canada,proofs,OPC R1 8B,1.0
544,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_2,canada,proofs,OPC R1 8B,1.0
545,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
546,GPT-5 (high),openai/gpt-5,canada_2025_2,canada,proofs,OPC R1 8B,1.0
547,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
548,Grok 4,xai/grok-4,canada_2025_2,canada,proofs,OPC R1 8B,0.0
549,o4-mini (high),openai/o4-mini--high,canada_2025_2,canada,proofs,OPC R1 8B,0.0
550,GPT OSS 120B (high),openai/oss-120b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
551,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_3,canada,proofs,OPC R1 8B,0.0
552,o4-mini (high),openai/o4-mini--high,canada_2025_3,canada,proofs,OPC R1 8B,0.0
553,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_3,canada,proofs,OPC R1 8B,0.0
554,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_3,canada,proofs,OPC R1 8B,0.0
555,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
556,Grok 4,xai/grok-4,canada_2025_3,canada,proofs,OPC R1 8B,1.0
557,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_3,canada,proofs,OPC R1 8B,0.0
558,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
559,GPT-5 (high),openai/gpt-5,canada_2025_3,canada,proofs,OPC R1 8B,0.0
560,GPT OSS 120B (high),openai/oss-120b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
561,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
562,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_4,canada,proofs,OPC R1 8B,0.0
563,Grok 4,xai/grok-4,canada_2025_4,canada,proofs,OPC R1 8B,0.0
564,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_4,canada,proofs,OPC R1 8B,0.0
565,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
566,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
567,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_4,canada,proofs,OPC R1 8B,0.0
568,GPT OSS 120B (high),openai/oss-120b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
569,o4-mini (high),openai/o4-mini--high,canada_2025_4,canada,proofs,OPC R1 8B,0.0
570,GPT-5 (high),openai/gpt-5,canada_2025_4,canada,proofs,OPC R1 8B,0.0
571,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
572,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_5,canada,proofs,OPC R1 8B,1.0
573,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
574,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
575,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_5,canada,proofs,OPC R1 8B,0.0
576,o4-mini (high),openai/o4-mini--high,canada_2025_5,canada,proofs,OPC R1 8B,1.0
577,GPT OSS 120B (high),openai/oss-120b,canada_2025_5,canada,proofs,OPC R1 8B,1.0
578,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_5,canada,proofs,OPC R1 8B,0.0
579,GPT-5 (high),openai/gpt-5,canada_2025_5,canada,proofs,OPC R1 8B,0.0
580,Grok 4,xai/grok-4,canada_2025_5,canada,proofs,OPC R1 8B,0.0
581,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_1,china,proofs,OPC R1 8B,0.0
582,GPT-5-mini (high),openai/gpt-5-mini,china_2025_1,china,proofs,OPC R1 8B,0.0
583,GPT OSS 120B (high),openai/oss-120b,china_2025_1,china,proofs,OPC R1 8B,1.0
584,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_1,china,proofs,OPC R1 8B,0.0
585,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_1,china,proofs,OPC R1 8B,0.0
586,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_1,china,proofs,OPC R1 8B,0.0
587,GPT-5 (high),openai/gpt-5,china_2025_1,china,proofs,OPC R1 8B,1.0
588,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_1,china,proofs,OPC R1 8B,0.0
589,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_1,china,proofs,OPC R1 8B,0.0
590,Grok 4,xai/grok-4,china_2025_1,china,proofs,OPC R1 8B,0.0
591,o4-mini (high),openai/o4-mini--high,china_2025_1,china,proofs,OPC R1 8B,0.0
592,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_2,china,proofs,OPC R1 8B,0.0
593,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_2,china,proofs,OPC R1 8B,0.0
594,GPT OSS 120B (high),openai/oss-120b,china_2025_2,china,proofs,OPC R1 8B,1.0
595,Grok 4,xai/grok-4,china_2025_2,china,proofs,OPC R1 8B,0.0
596,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_2,china,proofs,OPC R1 8B,1.0
597,GPT-5 (high),openai/gpt-5,china_2025_2,china,proofs,OPC R1 8B,0.0
598,o4-mini (high),openai/o4-mini--high,china_2025_2,china,proofs,OPC R1 8B,0.0
599,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_2,china,proofs,OPC R1 8B,0.0
600,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_2,china,proofs,OPC R1 8B,0.0
601,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_2,china,proofs,OPC R1 8B,0.0
602,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_3,china,proofs,OPC R1 8B,0.0
603,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_3,china,proofs,OPC R1 8B,0.0
604,GPT OSS 120B (high),openai/oss-120b,china_2025_3,china,proofs,OPC R1 8B,1.0
605,GPT-5-mini (high),openai/gpt-5-mini,china_2025_3,china,proofs,OPC R1 8B,0.0
606,Grok 4,xai/grok-4,china_2025_3,china,proofs,OPC R1 8B,0.0
607,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_3,china,proofs,OPC R1 8B,0.0
608,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_3,china,proofs,OPC R1 8B,0.0
609,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_3,china,proofs,OPC R1 8B,0.0
610,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_3,china,proofs,OPC R1 8B,1.0
611,o4-mini (high),openai/o4-mini--high,china_2025_3,china,proofs,OPC R1 8B,0.0
612,GPT-5-mini (high),openai/gpt-5-mini,china_2025_5,china,proofs,OPC R1 8B,0.0
613,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_5,china,proofs,OPC R1 8B,0.0
614,o4-mini (high),openai/o4-mini--high,china_2025_5,china,proofs,OPC R1 8B,0.0
615,Grok 4,xai/grok-4,china_2025_5,china,proofs,OPC R1 8B,0.0
616,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_5,china,proofs,OPC R1 8B,0.0
617,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_5,china,proofs,OPC R1 8B,0.0
618,GPT-5 (high),openai/gpt-5,china_2025_5,china,proofs,OPC R1 8B,0.0
619,GPT OSS 120B (high),openai/oss-120b,china_2025_5,china,proofs,OPC R1 8B,0.0
620,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_5,china,proofs,OPC R1 8B,0.0
621,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_5,china,proofs,OPC R1 8B,0.0
622,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_5,china,proofs,OPC R1 8B,0.0
623,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_6,china,proofs,OPC R1 8B,0.0
624,GPT-5 (high),openai/gpt-5,china_2025_6,china,proofs,OPC R1 8B,0.0
625,GPT-5-mini (high),openai/gpt-5-mini,china_2025_6,china,proofs,OPC R1 8B,0.0
626,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_6,china,proofs,OPC R1 8B,0.0
627,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_6,china,proofs,OPC R1 8B,0.0
628,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_6,china,proofs,OPC R1 8B,0.0
629,GPT OSS 120B (high),openai/oss-120b,china_2025_6,china,proofs,OPC R1 8B,0.0
630,o4-mini (high),openai/o4-mini--high,china_2025_6,china,proofs,OPC R1 8B,1.0
631,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_6,china,proofs,OPC R1 8B,0.0
632,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_6,china,proofs,OPC R1 8B,0.0
633,o4-mini (high),openai/o4-mini--high,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
634,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
635,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
636,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
637,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_1,chinatst,proofs,OPC R1 8B,1.0
638,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
639,GPT-5 (high),openai/gpt-5,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
640,Grok 4,xai/grok-4,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
641,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
642,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
643,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
644,o4-mini (high),openai/o4-mini--high,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
645,GPT-5 (high),openai/gpt-5,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
646,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
647,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
648,Grok 4,xai/grok-4,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
649,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
650,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
651,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
652,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
653,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
654,o4-mini (high),openai/o4-mini--high,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
655,Grok 4,xai/grok-4,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
656,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
657,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
658,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
659,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
660,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
661,GPT-5 (high),openai/gpt-5,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
662,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
663,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
664,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
665,o4-mini (high),openai/o4-mini--high,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
666,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
667,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
668,GPT-5 (high),openai/gpt-5,chinatst_2025_12,chinatst,proofs,OPC R1 8B,1.0
669,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
670,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
671,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
672,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
673,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
674,Grok 4,xai/grok-4,chinatst_2025_12,chinatst,proofs,OPC R1 8B,1.0
675,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
676,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
677,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
678,GPT-5 (high),openai/gpt-5,chinatst_2025_13,chinatst,proofs,OPC R1 8B,1.0
679,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
680,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
681,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
682,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
683,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
684,Grok 4,xai/grok-4,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
685,o4-mini (high),openai/o4-mini--high,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
686,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
687,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
688,o4-mini (high),openai/o4-mini--high,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
689,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
690,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
691,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
692,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
693,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,1.0
694,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
695,Grok 4,xai/grok-4,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
696,GPT-5 (high),openai/gpt-5,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
697,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
698,o4-mini (high),openai/o4-mini--high,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
699,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
700,GPT-5 (high),openai/gpt-5,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
701,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
702,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
703,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
704,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
705,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
706,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
707,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
708,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,1.0
709,o4-mini (high),openai/o4-mini--high,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
710,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
711,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
712,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
713,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
714,Grok 4,xai/grok-4,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
715,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
716,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
717,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
718,GPT-5 (high),openai/gpt-5,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
719,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
720,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
721,Grok 4,xai/grok-4,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
722,GPT-5 (high),openai/gpt-5,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
723,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
724,o4-mini (high),openai/o4-mini--high,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
725,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
726,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
727,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
728,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
729,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
730,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
731,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
732,GPT-5 (high),openai/gpt-5,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
733,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,1.0
734,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
735,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
736,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
737,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
738,o4-mini (high),openai/o4-mini--high,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
739,Grok 4,xai/grok-4,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
740,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
741,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
742,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
743,o4-mini (high),openai/o4-mini--high,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
744,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
745,Grok 4,xai/grok-4,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
747,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
748,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
749,GPT-5 (high),openai/gpt-5,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
750,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
751,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
752,o4-mini (high),openai/o4-mini--high,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
753,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
754,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
755,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,1.0
756,Grok 4,xai/grok-4,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
757,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
758,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
759,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
760,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,1.0
761,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
762,GPT-5 (high),openai/gpt-5,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
763,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
764,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
765,Grok 4,xai/grok-4,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
766,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
767,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
768,GPT-5 (high),openai/gpt-5,chinatst_2025_20,chinatst,proofs,OPC R1 8B,1.0
769,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
770,o4-mini (high),openai/o4-mini--high,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
771,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
772,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
773,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
774,Grok 4,xai/grok-4,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
775,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
776,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
777,GPT-5 (high),openai/gpt-5,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
778,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
779,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
780,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
781,o4-mini (high),openai/o4-mini--high,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
782,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
783,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
784,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
785,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
786,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
787,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
788,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
789,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
790,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
791,o4-mini (high),openai/o4-mini--high,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
792,Grok 4,xai/grok-4,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
793,GPT-5 (high),openai/gpt-5,chinatst_2025_22,chinatst,proofs,OPC R1 8B,1.0
794,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
795,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,1.0
796,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
797,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
798,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
799,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
800,GPT-5 (high),openai/gpt-5,chinatst_2025_3,chinatst,proofs,OPC R1 8B,1.0
801,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
802,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
803,o4-mini (high),openai/o4-mini--high,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
804,Grok 4,xai/grok-4,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
805,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
806,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
807,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
808,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
809,Grok 4,xai/grok-4,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
810,o4-mini (high),openai/o4-mini--high,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
811,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
812,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
813,GPT-5 (high),openai/gpt-5,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
814,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
815,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
816,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
817,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
818,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
819,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
820,Grok 4,xai/grok-4,chinatst_2025_5,chinatst,proofs,OPC R1 8B,1.0
821,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_5,chinatst,proofs,OPC R1 8B,1.0
822,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
823,GPT-5 (high),openai/gpt-5,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
824,o4-mini (high),openai/o4-mini--high,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
825,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
826,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
827,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
828,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
829,GPT-5 (high),openai/gpt-5,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
830,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
831,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
832,Grok 4,xai/grok-4,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
833,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
834,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
835,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
836,o4-mini (high),openai/o4-mini--high,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
837,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
838,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
839,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
840,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
841,GPT-5 (high),openai/gpt-5,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
842,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
843,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
844,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
845,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
846,Grok 4,xai/grok-4,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
847,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
848,o4-mini (high),openai/o4-mini--high,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
849,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
850,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
851,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
852,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
853,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
854,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
855,o4-mini (high),openai/o4-mini--high,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
856,GPT-5 (high),openai/gpt-5,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
857,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
858,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
859,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
860,Grok 4,xai/grok-4,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
861,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
862,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
863,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
864,o4-mini (high),openai/o4-mini--high,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
865,GPT-5 (high),openai/gpt-5,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
866,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
867,Grok 4,xai/grok-4,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
868,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
869,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
870,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
871,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
872,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
873,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
874,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
875,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
876,GPT-5 (high),openai/gpt-5,egmo_2025_1,egmo,proofs,OPC R1 8B,1.0
877,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
878,o4-mini (high),openai/o4-mini--high,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
879,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
880,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
881,GPT OSS 120B (high),openai/oss-120b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
882,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
883,Grok 4,xai/grok-4,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
884,Grok 4,xai/grok-4,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
885,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
886,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_2,egmo,proofs,OPC R1 8B,1.0
887,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
888,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
889,GPT OSS 120B (high),openai/oss-120b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
890,o4-mini (high),openai/o4-mini--high,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
891,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
892,GPT-5 (high),openai/gpt-5,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
893,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_2,egmo,proofs,OPC R1 8B,1.0
894,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
895,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
896,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
897,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
898,GPT-5 (high),openai/gpt-5,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
899,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
900,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
901,o4-mini (high),openai/o4-mini--high,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
902,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
903,GPT OSS 120B (high),openai/oss-120b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
904,Grok 4,xai/grok-4,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
905,GPT-5 (high),openai/gpt-5,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
906,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
907,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
908,o4-mini (high),openai/o4-mini--high,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
909,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
910,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
911,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
912,GPT OSS 120B (high),openai/oss-120b,egmo_2025_4,egmo,proofs,OPC R1 8B,1.0
913,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
914,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
915,Grok 4,xai/grok-4,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
916,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_5,egmo,proofs,OPC R1 8B,1.0
917,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
918,Grok 4,xai/grok-4,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
919,GPT OSS 120B (high),openai/oss-120b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
920,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
921,GPT-5 (high),openai/gpt-5,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
922,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
923,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
924,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
925,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
926,o4-mini (high),openai/o4-mini--high,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
927,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
928,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
929,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
930,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
931,GPT-5 (high),openai/gpt-5,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
932,o4-mini (high),openai/o4-mini--high,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
933,Grok 4,xai/grok-4,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
934,GPT OSS 120B (high),openai/oss-120b,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
935,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
936,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
937,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
938,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
939,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
940,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
941,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
942,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
943,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,1.0
944,GPT-5 (high),openai/gpt-5,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
945,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
946,Grok 4,xai/grok-4,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
947,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
948,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
949,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
950,Grok 4,xai/grok-4,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
951,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
952,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
953,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
954,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
955,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
956,GPT-5 (high),openai/gpt-5,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
957,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
958,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
959,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
960,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
961,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
962,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
963,Grok 4,xai/grok-4,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,1.0
964,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
965,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
966,GPT-5 (high),openai/gpt-5,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,1.0
967,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
968,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
969,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,1.0
970,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
971,GPT-5 (high),openai/gpt-5,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,1.0
972,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
973,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
974,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
975,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
976,Grok 4,xai/grok-4,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
977,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
978,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,0.0
979,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
980,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
981,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
982,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
983,Grok 4,xai/grok-4,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
984,GPT-5 (high),openai/gpt-5,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
985,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
986,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
987,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
988,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
989,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
990,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
991,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
992,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
993,Grok 4,xai/grok-4,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
994,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
995,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
996,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
997,GPT-5 (high),openai/gpt-5,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
998,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
999,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1000,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1001,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1002,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1003,GPT-5 (high),openai/gpt-5,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1004,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1005,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1006,Grok 4,xai/grok-4,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1007,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1008,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1009,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1010,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1011,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1012,Grok 4,xai/grok-4,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1013,GPT-5 (high),openai/gpt-5,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,1.0
1014,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1015,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1016,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1017,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1018,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1019,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1020,Grok 4,xai/grok-4,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1021,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1022,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1023,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1024,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1025,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1026,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1027,GPT-5 (high),openai/gpt-5,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1028,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1029,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1030,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1031,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1032,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1033,GPT-5 (high),openai/gpt-5,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1034,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1035,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1036,Grok 4,xai/grok-4,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1037,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1038,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1039,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1040,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1041,Grok 4,xai/grok-4,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1042,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1043,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1044,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1045,GPT-5 (high),openai/gpt-5,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1046,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1047,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1048,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1049,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1050,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1051,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1052,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1053,Grok 4,xai/grok-4,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1054,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1055,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1056,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1057,GPT-5 (high),openai/gpt-5,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1058,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1059,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1060,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1061,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1062,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,1.0
1063,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1064,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1065,GPT-5 (high),openai/gpt-5,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1066,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1067,Grok 4,xai/grok-4,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1068,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1069,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1070,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1071,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1072,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1073,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1074,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1075,Grok 4,xai/grok-4,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1076,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1077,GPT-5 (high),openai/gpt-5,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,1.0
1078,GPT-5 (high),openai/gpt-5,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1079,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,1.0
1080,Grok 4,xai/grok-4,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1081,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1082,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1083,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1084,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1085,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,1.0
1086,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1087,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1088,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1089,GPT-5 (high),openai/gpt-5,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1090,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1091,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1092,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1093,Grok 4,xai/grok-4,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1094,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1095,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1096,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1097,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1098,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1099,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1100,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1101,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1102,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1103,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1104,Grok 4,xai/grok-4,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1105,GPT-5 (high),openai/gpt-5,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1106,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1107,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1108,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1109,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1110,Grok 4,xai/grok-4,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1111,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1112,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1113,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1114,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1115,GPT-5 (high),openai/gpt-5,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1116,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1117,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1118,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1119,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1120,GPT-5 (high),openai/gpt-5,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1121,Grok 4,xai/grok-4,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1122,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1123,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1124,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,1.0
1125,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,1.0
1126,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1127,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1128,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1129,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1130,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1131,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1132,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1133,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1134,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1135,Grok 4,xai/grok-4,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1136,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1137,GPT-5 (high),openai/gpt-5,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1138,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1139,Grok 4,xai/grok-4,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1140,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1141,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1142,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1143,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1144,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1145,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1146,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1147,GPT-5 (high),openai/gpt-5,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1148,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1149,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1150,GPT-5 (high),openai/gpt-5,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1151,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1152,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1153,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1154,Grok 4,xai/grok-4,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1155,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,1.0
1156,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1157,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1158,Grok 4,xai/grok-4,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1159,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1160,GPT-5 (high),openai/gpt-5,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1161,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1162,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1163,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1164,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,1.0
1165,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1166,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1167,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1168,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1169,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1170,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1171,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,1.0
1172,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1173,Grok 4,xai/grok-4,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1174,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1175,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1176,GPT-5 (high),openai/gpt-5,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1177,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1178,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1179,Grok 4,xai/grok-4,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1180,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1181,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1182,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1183,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1184,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1185,GPT-5 (high),openai/gpt-5,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1186,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1187,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1188,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1189,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1190,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1191,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1192,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1193,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1194,Grok 4,xai/grok-4,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1195,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1196,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1197,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1198,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1199,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1200,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1201,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,1.0
1202,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,1.0
1204,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1205,Grok 4,xai/grok-4,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1206,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1207,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1208,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1209,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1210,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1211,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1212,Grok 4,xai/grok-4,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1213,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1214,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1215,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1216,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1217,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1218,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1219,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1220,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1221,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1222,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1223,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1224,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1225,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1226,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1227,Grok 4,xai/grok-4,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1228,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1229,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,1.0
1230,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,1.0
1231,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1232,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1233,Grok 4,xai/grok-4,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1234,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1235,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1236,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1237,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1238,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1239,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1240,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1241,Grok 4,xai/grok-4,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1242,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1243,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1244,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1245,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1246,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1247,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1248,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1249,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1250,Grok 4,xai/grok-4,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1251,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1252,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1253,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1254,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1255,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1256,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1257,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1258,o4-mini (high),openai/o4-mini--high,german_2025_1,german,proofs,OPC R1 8B,1.0
1259,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_1,german,proofs,OPC R1 8B,1.0
1260,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_1,german,proofs,OPC R1 8B,1.0
1261,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_1,german,proofs,OPC R1 8B,1.0
1262,Grok 4,xai/grok-4,german_2025_1,german,proofs,OPC R1 8B,1.0
1263,GPT-5 (high),openai/gpt-5,german_2025_1,german,proofs,OPC R1 8B,1.0
1264,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_1,german,proofs,OPC R1 8B,1.0
1265,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_1,german,proofs,OPC R1 8B,1.0
1266,GPT OSS 120B (high),openai/oss-120b,german_2025_1,german,proofs,OPC R1 8B,1.0
1267,GPT-5-mini (high),openai/gpt-5-mini,german_2025_1,german,proofs,OPC R1 8B,1.0
1268,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_1,german,proofs,OPC R1 8B,1.0
1269,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_2,german,proofs,OPC R1 8B,0.0
1270,o4-mini (high),openai/o4-mini--high,german_2025_2,german,proofs,OPC R1 8B,0.0
1271,GPT-5 (high),openai/gpt-5,german_2025_2,german,proofs,OPC R1 8B,0.0
1272,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_2,german,proofs,OPC R1 8B,0.0
1273,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_2,german,proofs,OPC R1 8B,0.0
1274,GPT-5-mini (high),openai/gpt-5-mini,german_2025_2,german,proofs,OPC R1 8B,0.0
1275,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_2,german,proofs,OPC R1 8B,0.0
1276,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_2,german,proofs,OPC R1 8B,0.0
1277,GPT OSS 120B (high),openai/oss-120b,german_2025_2,german,proofs,OPC R1 8B,1.0
1278,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_2,german,proofs,OPC R1 8B,0.0
1279,Grok 4,xai/grok-4,german_2025_2,german,proofs,OPC R1 8B,0.0
1280,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_3,german,proofs,OPC R1 8B,0.0
1281,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_3,german,proofs,OPC R1 8B,1.0
1282,Grok 4,xai/grok-4,german_2025_3,german,proofs,OPC R1 8B,1.0
1283,o4-mini (high),openai/o4-mini--high,german_2025_3,german,proofs,OPC R1 8B,0.0
1284,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_3,german,proofs,OPC R1 8B,0.0
1285,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_3,german,proofs,OPC R1 8B,0.0
1286,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_3,german,proofs,OPC R1 8B,1.0
1287,GPT-5 (high),openai/gpt-5,german_2025_3,german,proofs,OPC R1 8B,1.0
1288,GPT OSS 120B (high),openai/oss-120b,german_2025_3,german,proofs,OPC R1 8B,0.0
1289,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_3,german,proofs,OPC R1 8B,1.0
1290,GPT-5-mini (high),openai/gpt-5-mini,german_2025_3,german,proofs,OPC R1 8B,1.0
1291,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_4,german,proofs,OPC R1 8B,1.0
1292,Grok 4,xai/grok-4,german_2025_4,german,proofs,OPC R1 8B,1.0
1293,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_4,german,proofs,OPC R1 8B,0.0
1294,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_4,german,proofs,OPC R1 8B,0.0
1295,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_4,german,proofs,OPC R1 8B,1.0
1296,o4-mini (high),openai/o4-mini--high,german_2025_4,german,proofs,OPC R1 8B,0.0
1297,GPT OSS 120B (high),openai/oss-120b,german_2025_4,german,proofs,OPC R1 8B,0.0
1298,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_4,german,proofs,OPC R1 8B,1.0
1299,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_4,german,proofs,OPC R1 8B,0.0
1300,GPT-5-mini (high),openai/gpt-5-mini,german_2025_4,german,proofs,OPC R1 8B,0.0
1301,GPT-5 (high),openai/gpt-5,german_2025_4,german,proofs,OPC R1 8B,0.0
1302,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1303,GPT-5 (high),openai/gpt-5,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1304,GPT OSS 120B (high),openai/oss-120b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1305,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1306,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1307,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1308,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1309,o4-mini (high),openai/o4-mini--high,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1310,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1311,Grok 4,xai/grok-4,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1312,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1313,Grok 4,xai/grok-4,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1314,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1315,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1316,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1317,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1318,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1319,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1320,GPT OSS 120B (high),openai/oss-120b,greece_2025_2,greece,proofs,OPC R1 8B,1.0
1321,o4-mini (high),openai/o4-mini--high,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1322,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1323,GPT-5 (high),openai/gpt-5,greece_2025_2,greece,proofs,OPC R1 8B,1.0
1324,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1325,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1326,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1327,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1328,GPT OSS 120B (high),openai/oss-120b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1329,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1330,GPT-5 (high),openai/gpt-5,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1331,o4-mini (high),openai/o4-mini--high,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1332,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1333,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1334,Grok 4,xai/grok-4,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1335,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1336,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1337,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1338,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1339,Grok 4,xai/grok-4,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1340,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1341,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_4,greece,proofs,OPC R1 8B,1.0
1342,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1343,GPT-5 (high),openai/gpt-5,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1344,o4-mini (high),openai/o4-mini--high,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1345,GPT OSS 120B (high),openai/oss-120b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1346,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1347,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1348,o4-mini (high),openai/o4-mini--high,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1349,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1350,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1351,Grok 4,xai/grok-4,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1352,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1353,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1354,GPT OSS 120B (high),openai/oss-120b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1355,GPT-5 (high),openai/gpt-5,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1356,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1357,o4-mini (high),openai/o4-mini--high,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1358,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1359,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1360,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1361,GPT OSS 120B (high),openai/oss-120b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1362,Grok 4,xai/grok-4,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1363,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1364,GPT-5 (high),openai/gpt-5,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1365,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1366,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1367,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1368,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1369,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1370,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1371,Grok 4,xai/grok-4,imosl_2025_11,imosl,proofs,OPC R1 8B,1.0
1372,GPT-5 (high),openai/gpt-5,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1373,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1374,GPT OSS 120B (high),openai/oss-120b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1375,o4-mini (high),openai/o4-mini--high,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1376,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1377,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1378,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1379,GPT OSS 120B (high),openai/oss-120b,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1380,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1381,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1382,GPT-5 (high),openai/gpt-5,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1383,Grok 4,xai/grok-4,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1384,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1385,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1386,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1387,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1388,o4-mini (high),openai/o4-mini--high,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1389,GPT OSS 120B (high),openai/oss-120b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1390,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1391,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1392,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1393,GPT-5 (high),openai/gpt-5,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1394,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1395,Grok 4,xai/grok-4,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1396,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1397,o4-mini (high),openai/o4-mini--high,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1398,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1399,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1400,GPT-5 (high),openai/gpt-5,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1401,o4-mini (high),openai/o4-mini--high,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1402,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1403,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1404,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1405,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1406,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1407,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1408,GPT OSS 120B (high),openai/oss-120b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1409,GPT-5 (high),openai/gpt-5,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1410,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1411,o4-mini (high),openai/o4-mini--high,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1412,GPT OSS 120B (high),openai/oss-120b,imosl_2025_15,imosl,proofs,OPC R1 8B,1.0
1413,Grok 4,xai/grok-4,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1414,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1415,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1416,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1417,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1418,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1419,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1420,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1421,o4-mini (high),openai/o4-mini--high,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1422,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1423,Grok 4,xai/grok-4,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1424,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1425,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1426,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1427,GPT OSS 120B (high),openai/oss-120b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1428,GPT-5 (high),openai/gpt-5,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1429,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1430,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1431,Grok 4,xai/grok-4,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1432,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1433,o4-mini (high),openai/o4-mini--high,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1434,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1435,GPT-5 (high),openai/gpt-5,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1436,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1437,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1438,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1439,GPT OSS 120B (high),openai/oss-120b,imosl_2025_17,imosl,proofs,OPC R1 8B,1.0
1440,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1441,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1442,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1443,GPT-5 (high),openai/gpt-5,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1444,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1445,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_18,imosl,proofs,OPC R1 8B,1.0
1446,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1447,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1448,GPT OSS 120B (high),openai/oss-120b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1449,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1450,o4-mini (high),openai/o4-mini--high,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1451,GPT OSS 120B (high),openai/oss-120b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1452,GPT-5 (high),openai/gpt-5,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1453,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1454,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1455,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1456,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1457,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1458,Grok 4,xai/grok-4,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1459,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1460,o4-mini (high),openai/o4-mini--high,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1461,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1462,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1463,GPT OSS 120B (high),openai/oss-120b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1464,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1465,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1466,Grok 4,xai/grok-4,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1467,GPT-5 (high),openai/gpt-5,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1468,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1469,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1470,o4-mini (high),openai/o4-mini--high,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1471,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1472,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1473,GPT-5 (high),openai/gpt-5,imosl_2025_20,imosl,proofs,OPC R1 8B,1.0
1474,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1475,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1476,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1477,GPT OSS 120B (high),openai/oss-120b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1478,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1479,o4-mini (high),openai/o4-mini--high,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1480,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1481,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1482,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1483,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1484,Grok 4,xai/grok-4,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1485,o4-mini (high),openai/o4-mini--high,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1486,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1487,GPT-5 (high),openai/gpt-5,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1488,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1489,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1490,GPT OSS 120B (high),openai/oss-120b,imosl_2025_21,imosl,proofs,OPC R1 8B,1.0
1491,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1492,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1493,Grok 4,xai/grok-4,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1494,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1495,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1496,GPT-5 (high),openai/gpt-5,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1497,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1498,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1499,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1500,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1501,GPT OSS 120B (high),openai/oss-120b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1502,o4-mini (high),openai/o4-mini--high,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1503,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1504,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1505,Grok 4,xai/grok-4,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1506,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1507,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_23,imosl,proofs,OPC R1 8B,1.0
1508,o4-mini (high),openai/o4-mini--high,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1509,GPT-5 (high),openai/gpt-5,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1510,GPT OSS 120B (high),openai/oss-120b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1511,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1512,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1513,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1514,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1515,GPT OSS 120B (high),openai/oss-120b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1516,GPT-5 (high),openai/gpt-5,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1517,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1518,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1519,Grok 4,xai/grok-4,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1520,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1521,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1522,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1523,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1524,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1525,o4-mini (high),openai/o4-mini--high,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1526,GPT OSS 120B (high),openai/oss-120b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1527,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1528,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1529,o4-mini (high),openai/o4-mini--high,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1530,GPT-5 (high),openai/gpt-5,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1531,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1532,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1533,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1534,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1535,Grok 4,xai/grok-4,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1536,GPT OSS 120B (high),openai/oss-120b,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1537,GPT-5 (high),openai/gpt-5,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1538,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1539,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1540,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1541,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1542,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1543,Grok 4,xai/grok-4,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1544,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1545,o4-mini (high),openai/o4-mini--high,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1546,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1547,GPT-5 (high),openai/gpt-5,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1548,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1549,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1550,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1551,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1552,o4-mini (high),openai/o4-mini--high,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1553,Grok 4,xai/grok-4,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1554,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1555,GPT OSS 120B (high),openai/oss-120b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1556,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_27,imosl,proofs,OPC R1 8B,1.0
1557,Grok 4,xai/grok-4,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1558,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1559,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1560,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1561,GPT-5 (high),openai/gpt-5,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1562,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_28,imosl,proofs,OPC R1 8B,1.0
1563,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1564,GPT OSS 120B (high),openai/oss-120b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1565,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1566,o4-mini (high),openai/o4-mini--high,imosl_2025_28,imosl,proofs,OPC R1 8B,1.0
1567,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1568,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1569,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1570,Grok 4,xai/grok-4,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1571,GPT-5 (high),openai/gpt-5,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1572,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1573,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1574,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1575,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1576,o4-mini (high),openai/o4-mini--high,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1577,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1578,GPT OSS 120B (high),openai/oss-120b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1579,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1580,GPT-5 (high),openai/gpt-5,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1581,GPT OSS 120B (high),openai/oss-120b,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1582,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1583,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1584,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1585,Grok 4,xai/grok-4,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1586,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1587,o4-mini (high),openai/o4-mini--high,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1588,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1589,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1590,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1591,Grok 4,xai/grok-4,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1592,GPT OSS 120B (high),openai/oss-120b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1593,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1594,GPT-5 (high),openai/gpt-5,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1595,o4-mini (high),openai/o4-mini--high,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1596,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1597,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1598,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1599,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1600,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1601,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1602,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_31,imosl,proofs,OPC R1 8B,1.0
1603,o4-mini (high),openai/o4-mini--high,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1604,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1605,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_31,imosl,proofs,OPC R1 8B,1.0
1606,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1607,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1608,GPT OSS 120B (high),openai/oss-120b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1609,GPT-5 (high),openai/gpt-5,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1610,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1611,Grok 4,xai/grok-4,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1612,GPT OSS 120B (high),openai/oss-120b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1613,o4-mini (high),openai/o4-mini--high,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1614,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1615,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1616,GPT-5 (high),openai/gpt-5,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1617,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1618,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1619,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1620,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1621,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1622,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1623,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1624,Grok 4,xai/grok-4,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1625,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1626,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1627,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1628,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1629,GPT-5 (high),openai/gpt-5,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1630,o4-mini (high),openai/o4-mini--high,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1631,GPT OSS 120B (high),openai/oss-120b,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1632,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1633,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1634,GPT OSS 120B (high),openai/oss-120b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1635,Grok 4,xai/grok-4,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1636,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1637,GPT-5 (high),openai/gpt-5,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1638,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1639,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1640,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1641,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1642,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1643,o4-mini (high),openai/o4-mini--high,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1644,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1645,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1646,Grok 4,xai/grok-4,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1647,GPT OSS 120B (high),openai/oss-120b,imosl_2025_35,imosl,proofs,OPC R1 8B,1.0
1648,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1649,GPT-5 (high),openai/gpt-5,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1650,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1651,o4-mini (high),openai/o4-mini--high,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1652,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1653,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1654,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1655,GPT-5 (high),openai/gpt-5,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1656,Grok 4,xai/grok-4,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1657,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1658,GPT OSS 120B (high),openai/oss-120b,imosl_2025_36,imosl,proofs,OPC R1 8B,1.0
1659,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1660,o4-mini (high),openai/o4-mini--high,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1661,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1662,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1663,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_36,imosl,proofs,OPC R1 8B,1.0
1664,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1665,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1666,o4-mini (high),openai/o4-mini--high,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1667,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1668,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1669,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1670,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1671,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1672,Grok 4,xai/grok-4,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1673,GPT OSS 120B (high),openai/oss-120b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1674,GPT-5 (high),openai/gpt-5,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1675,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1676,Grok 4,xai/grok-4,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1677,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1678,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1679,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1680,o4-mini (high),openai/o4-mini--high,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1681,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1682,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1683,GPT OSS 120B (high),openai/oss-120b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1684,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1685,GPT-5 (high),openai/gpt-5,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1686,o4-mini (high),openai/o4-mini--high,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1687,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1688,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1689,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1690,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1691,GPT-5 (high),openai/gpt-5,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1692,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1693,GPT OSS 120B (high),openai/oss-120b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1694,Grok 4,xai/grok-4,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1695,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1696,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1697,GPT-5 (high),openai/gpt-5,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1698,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1699,GPT OSS 120B (high),openai/oss-120b,imosl_2025_6,imosl,proofs,OPC R1 8B,1.0
1700,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1701,o4-mini (high),openai/o4-mini--high,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1702,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1703,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1704,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1705,Grok 4,xai/grok-4,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1706,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1707,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1708,GPT OSS 120B (high),openai/oss-120b,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1709,o4-mini (high),openai/o4-mini--high,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1710,Grok 4,xai/grok-4,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1711,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1712,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1713,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1714,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1715,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1716,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1717,GPT-5 (high),openai/gpt-5,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1718,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1719,GPT OSS 120B (high),openai/oss-120b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1720,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_8,imosl,proofs,OPC R1 8B,1.0
1721,o4-mini (high),openai/o4-mini--high,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1722,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1723,GPT-5 (high),openai/gpt-5,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1724,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1725,Grok 4,xai/grok-4,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1726,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1727,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1728,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1729,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1730,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1731,o4-mini (high),openai/o4-mini--high,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1732,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1733,GPT OSS 120B (high),openai/oss-120b,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1734,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1735,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1736,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1737,Grok 4,xai/grok-4,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1738,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1739,GPT-5 (high),openai/gpt-5,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1740,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_1,india,proofs,OPC R1 8B,1.0
1741,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_1,india,proofs,OPC R1 8B,1.0
1742,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_1,india,proofs,OPC R1 8B,0.0
1743,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_1,india,proofs,OPC R1 8B,0.0
1744,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_1,india,proofs,OPC R1 8B,0.0
1745,GPT-5-mini (high),openai/gpt-5-mini,india_2025_1,india,proofs,OPC R1 8B,1.0
1746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_1,india,proofs,OPC R1 8B,1.0
1747,GPT-5 (high),openai/gpt-5,india_2025_1,india,proofs,OPC R1 8B,1.0
1748,o4-mini (high),openai/o4-mini--high,india_2025_1,india,proofs,OPC R1 8B,1.0
1749,GPT OSS 120B (high),openai/oss-120b,india_2025_1,india,proofs,OPC R1 8B,0.0
1750,Grok 4,xai/grok-4,india_2025_1,india,proofs,OPC R1 8B,1.0
1751,o4-mini (high),openai/o4-mini--high,india_2025_2,india,proofs,OPC R1 8B,0.0
1752,GPT-5-mini (high),openai/gpt-5-mini,india_2025_2,india,proofs,OPC R1 8B,0.0
1753,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_2,india,proofs,OPC R1 8B,0.0
1754,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_2,india,proofs,OPC R1 8B,0.0
1755,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_2,india,proofs,OPC R1 8B,0.0
1756,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_2,india,proofs,OPC R1 8B,0.0
1757,GPT-5 (high),openai/gpt-5,india_2025_2,india,proofs,OPC R1 8B,0.0
1758,GPT OSS 120B (high),openai/oss-120b,india_2025_2,india,proofs,OPC R1 8B,0.0
1759,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_2,india,proofs,OPC R1 8B,0.0
1760,Grok 4,xai/grok-4,india_2025_2,india,proofs,OPC R1 8B,0.0
1761,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_2,india,proofs,OPC R1 8B,0.0
1762,GPT-5 (high),openai/gpt-5,india_2025_3,india,proofs,OPC R1 8B,0.0
1763,GPT-5-mini (high),openai/gpt-5-mini,india_2025_3,india,proofs,OPC R1 8B,0.0
1764,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_3,india,proofs,OPC R1 8B,0.0
1765,o4-mini (high),openai/o4-mini--high,india_2025_3,india,proofs,OPC R1 8B,0.0
1766,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_3,india,proofs,OPC R1 8B,0.0
1767,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_3,india,proofs,OPC R1 8B,0.0
1768,GPT OSS 120B (high),openai/oss-120b,india_2025_3,india,proofs,OPC R1 8B,1.0
1769,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_3,india,proofs,OPC R1 8B,0.0
1770,Grok 4,xai/grok-4,india_2025_3,india,proofs,OPC R1 8B,0.0
1771,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_3,india,proofs,OPC R1 8B,0.0
1772,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_3,india,proofs,OPC R1 8B,0.0
1773,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_4,india,proofs,OPC R1 8B,0.0
1774,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_4,india,proofs,OPC R1 8B,0.0
1775,Grok 4,xai/grok-4,india_2025_4,india,proofs,OPC R1 8B,1.0
1776,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_4,india,proofs,OPC R1 8B,0.0
1777,o4-mini (high),openai/o4-mini--high,india_2025_4,india,proofs,OPC R1 8B,0.0
1778,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_4,india,proofs,OPC R1 8B,1.0
1779,GPT-5 (high),openai/gpt-5,india_2025_4,india,proofs,OPC R1 8B,0.0
1780,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_4,india,proofs,OPC R1 8B,1.0
1781,GPT-5-mini (high),openai/gpt-5-mini,india_2025_4,india,proofs,OPC R1 8B,0.0
1782,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_4,india,proofs,OPC R1 8B,1.0
1783,GPT OSS 120B (high),openai/oss-120b,india_2025_4,india,proofs,OPC R1 8B,0.0
1784,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_5,india,proofs,OPC R1 8B,0.0
1785,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_5,india,proofs,OPC R1 8B,0.0
1786,GPT OSS 120B (high),openai/oss-120b,india_2025_5,india,proofs,OPC R1 8B,0.0
1787,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_5,india,proofs,OPC R1 8B,0.0
1788,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_5,india,proofs,OPC R1 8B,0.0
1789,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_5,india,proofs,OPC R1 8B,0.0
1790,Grok 4,xai/grok-4,india_2025_5,india,proofs,OPC R1 8B,0.0
1791,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_5,india,proofs,OPC R1 8B,0.0
1792,o4-mini (high),openai/o4-mini--high,india_2025_5,india,proofs,OPC R1 8B,0.0
1793,GPT-5 (high),openai/gpt-5,india_2025_5,india,proofs,OPC R1 8B,0.0
1794,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_6,india,proofs,OPC R1 8B,0.0
1795,GPT-5 (high),openai/gpt-5,india_2025_6,india,proofs,OPC R1 8B,0.0
1796,o4-mini (high),openai/o4-mini--high,india_2025_6,india,proofs,OPC R1 8B,0.0
1797,GPT-5-mini (high),openai/gpt-5-mini,india_2025_6,india,proofs,OPC R1 8B,0.0
1798,GPT OSS 120B (high),openai/oss-120b,india_2025_6,india,proofs,OPC R1 8B,1.0
1799,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_6,india,proofs,OPC R1 8B,0.0
1800,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_6,india,proofs,OPC R1 8B,0.0
1801,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_6,india,proofs,OPC R1 8B,0.0
1802,Grok 4,xai/grok-4,india_2025_6,india,proofs,OPC R1 8B,0.0
1803,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_6,india,proofs,OPC R1 8B,0.0
1804,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_6,india,proofs,OPC R1 8B,0.0
1805,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1806,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1807,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1808,o4-mini (high),openai/o4-mini--high,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1809,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1810,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1811,Grok 4,xai/grok-4,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1812,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1813,GPT-5 (high),openai/gpt-5,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1814,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1815,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1816,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1817,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1818,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1819,GPT-5 (high),openai/gpt-5,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1820,Grok 4,xai/grok-4,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1821,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1822,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1823,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1824,o4-mini (high),openai/o4-mini--high,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1825,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1826,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1827,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1828,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1829,o4-mini (high),openai/o4-mini--high,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1830,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1831,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1832,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1833,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1834,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1835,GPT-5 (high),openai/gpt-5,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1836,Grok 4,xai/grok-4,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1837,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1838,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1839,GPT-5 (high),openai/gpt-5,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1840,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1841,o4-mini (high),openai/o4-mini--high,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1842,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1843,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1844,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1845,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1846,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1847,Grok 4,xai/grok-4,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1848,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1849,o4-mini (high),openai/o4-mini--high,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1850,GPT-5 (high),openai/gpt-5,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1851,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1852,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1853,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1854,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1855,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1856,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1857,Grok 4,xai/grok-4,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1858,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1859,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1860,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1861,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1862,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1863,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1864,Grok 4,xai/grok-4,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1865,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1866,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1867,o4-mini (high),openai/o4-mini--high,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1868,GPT-5 (high),openai/gpt-5,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1869,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1870,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1871,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1872,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1873,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1874,o4-mini (high),openai/o4-mini--high,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1875,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1876,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_15,india,proofs,OPC R1 8B,1.0
1877,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1878,Grok 4,xai/grok-4,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1879,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1880,GPT-5 (high),openai/gpt-5,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1881,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1882,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1883,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1884,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1885,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1886,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1887,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1888,Grok 4,xai/grok-4,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1889,GPT-5 (high),openai/gpt-5,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1890,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1891,o4-mini (high),openai/o4-mini--high,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1892,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1893,GPT-5 (high),openai/gpt-5,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1894,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_17,india,proofs,OPC R1 8B,1.0
1895,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1896,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_17,india,proofs,OPC R1 8B,1.0
1897,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1898,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1899,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1900,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1901,o4-mini (high),openai/o4-mini--high,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1902,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1903,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1904,o4-mini (high),openai/o4-mini--high,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1905,GPT-5 (high),openai/gpt-5,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1906,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1907,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1908,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1909,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1910,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1911,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1912,Grok 4,xai/grok-4,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1913,GPT-5 (high),openai/gpt-5,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1914,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_19,india,proofs,OPC R1 8B,1.0
1915,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1916,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1917,Grok 4,xai/grok-4,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1918,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1919,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1920,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_19,india,proofs,OPC R1 8B,1.0
1921,o4-mini (high),openai/o4-mini--high,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1922,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1923,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1924,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_2,india,proofs,OPC R1 8B,1.0
1925,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1926,GPT-5 (high),openai/gpt-5,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1927,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1928,Grok 4,xai/grok-4,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1929,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1930,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1931,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1932,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1933,o4-mini (high),openai/o4-mini--high,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1934,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1935,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1936,GPT-5 (high),openai/gpt-5,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1937,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1938,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1939,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1940,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1941,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1942,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_20,india,proofs,OPC R1 8B,1.0
1943,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1944,o4-mini (high),openai/o4-mini--high,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1945,Grok 4,xai/grok-4,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1946,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1947,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1948,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1949,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1950,o4-mini (high),openai/o4-mini--high,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1951,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1952,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1953,GPT-5 (high),openai/gpt-5,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1954,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1955,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_21,india,proofs,OPC R1 8B,1.0
1956,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1957,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1958,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1959,Grok 4,xai/grok-4,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1960,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1961,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_3,india,proofs,OPC R1 8B,1.0
1962,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1963,GPT-5 (high),openai/gpt-5,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1964,o4-mini (high),openai/o4-mini--high,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1965,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1966,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1967,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1968,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1969,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1970,Grok 4,xai/grok-4,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1971,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1972,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1973,o4-mini (high),openai/o4-mini--high,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1974,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1975,GPT-5 (high),openai/gpt-5,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1976,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1977,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1978,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1979,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1980,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1981,Grok 4,xai/grok-4,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1982,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1983,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1984,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1985,GPT-5 (high),openai/gpt-5,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1986,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1987,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1988,o4-mini (high),openai/o4-mini--high,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1989,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1990,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1991,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1992,o4-mini (high),openai/o4-mini--high,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1993,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1994,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_6,india,proofs,OPC R1 8B,1.0
1995,GPT-5 (high),openai/gpt-5,india_prep_2025_6,india,proofs,OPC R1 8B,1.0
1996,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1997,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1998,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1999,Grok 4,xai/grok-4,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
2000,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2001,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2002,Grok 4,xai/grok-4,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2003,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2004,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2005,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2006,o4-mini (high),openai/o4-mini--high,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2007,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2008,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2009,GPT-5 (high),openai/gpt-5,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2010,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2011,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2012,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2013,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2014,GPT-5 (high),openai/gpt-5,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2015,o4-mini (high),openai/o4-mini--high,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2016,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2017,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2018,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2019,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2020,Grok 4,xai/grok-4,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2021,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2022,GPT-5 (high),openai/gpt-5,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2023,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2024,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2025,Grok 4,xai/grok-4,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2026,o4-mini (high),openai/o4-mini--high,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2027,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2028,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2029,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2030,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2031,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2032,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2033,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2034,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2035,o4-mini (high),openai/o4-mini--high,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2036,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2037,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2038,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_1,iran,proofs,OPC R1 8B,1.0
2039,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2040,Grok 4,xai/grok-4,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2041,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2042,GPT-5 (high),openai/gpt-5,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2043,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2044,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2045,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_2,iran,proofs,OPC R1 8B,1.0
2046,o4-mini (high),openai/o4-mini--high,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2047,GPT-5 (high),openai/gpt-5,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2048,Grok 4,xai/grok-4,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2049,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2050,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2051,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2052,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2053,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2054,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2055,Grok 4,xai/grok-4,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2056,GPT-5 (high),openai/gpt-5,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2057,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2058,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2059,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2060,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2061,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2062,o4-mini (high),openai/o4-mini--high,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2063,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2064,o4-mini (high),openai/o4-mini--high,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2065,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2066,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2067,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2068,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2069,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2070,GPT-5 (high),openai/gpt-5,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2071,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2072,Grok 4,xai/grok-4,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2073,Grok 4,xai/grok-4,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2074,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2075,GPT-5 (high),openai/gpt-5,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2076,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2077,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2078,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2079,o4-mini (high),openai/o4-mini--high,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2080,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2081,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2082,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_5,iran,proofs,OPC R1 8B,1.0
2083,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2084,Grok 4,xai/grok-4,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2085,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2086,o4-mini (high),openai/o4-mini--high,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2087,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2088,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2089,GPT-5 (high),openai/gpt-5,iran_tst_2025_6,iran,proofs,OPC R1 8B,1.0
2090,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2091,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_6,iran,proofs,OPC R1 8B,1.0
2092,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2093,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2094,GPT-5 (high),openai/gpt-5,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2095,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2096,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2097,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2098,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2099,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2100,o4-mini (high),openai/o4-mini--high,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2101,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2102,Grok 4,xai/grok-4,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2103,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_8,iran,proofs,OPC R1 8B,1.0
2104,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2105,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2106,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2107,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2108,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2109,Grok 4,xai/grok-4,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2110,o4-mini (high),openai/o4-mini--high,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2111,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2112,GPT-5 (high),openai/gpt-5,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2113,o4-mini (high),openai/o4-mini--high,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2114,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2115,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2116,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_9,iran,proofs,OPC R1 8B,1.0
2117,Grok 4,xai/grok-4,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2118,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2119,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_9,iran,proofs,OPC R1 8B,1.0
2120,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2121,GPT-5 (high),openai/gpt-5,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2122,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2123,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_1,israel,proofs,OPC R1 8B,1.0
2124,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2125,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2126,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2127,o4-mini (high),openai/o4-mini--high,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2128,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2129,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2130,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2131,GPT-5 (high),openai/gpt-5,israel_tst_2025_1,israel,proofs,OPC R1 8B,1.0
2132,Grok 4,xai/grok-4,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2133,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2134,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2135,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2136,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2137,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2138,GPT-5 (high),openai/gpt-5,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2139,o4-mini (high),openai/o4-mini--high,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2140,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_10,israel,proofs,OPC R1 8B,1.0
2141,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2142,Grok 4,xai/grok-4,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2143,Grok 4,xai/grok-4,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2144,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2145,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2146,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2147,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2148,GPT-5 (high),openai/gpt-5,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2149,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2150,o4-mini (high),openai/o4-mini--high,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2151,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2152,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2153,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2154,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2155,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_3,israel,proofs,OPC R1 8B,1.0
2156,Grok 4,xai/grok-4,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2157,GPT-5 (high),openai/gpt-5,israel_tst_2025_3,israel,proofs,OPC R1 8B,1.0
2158,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2159,o4-mini (high),openai/o4-mini--high,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2160,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2161,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2162,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2163,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2164,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2165,o4-mini (high),openai/o4-mini--high,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2166,Grok 4,xai/grok-4,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2167,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2168,GPT-5 (high),openai/gpt-5,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2170,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2171,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2172,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2173,GPT-5 (high),openai/gpt-5,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2174,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2175,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2176,Grok 4,xai/grok-4,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2177,o4-mini (high),openai/o4-mini--high,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2178,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2179,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2180,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_5,israel,proofs,OPC R1 8B,1.0
2181,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2182,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2183,GPT-5 (high),openai/gpt-5,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2184,Grok 4,xai/grok-4,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2185,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2186,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2187,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2188,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2189,o4-mini (high),openai/o4-mini--high,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2190,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_6,israel,proofs,OPC R1 8B,1.0
2191,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2192,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2193,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2194,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_7,israel,proofs,OPC R1 8B,1.0
2195,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2196,o4-mini (high),openai/o4-mini--high,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2197,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2198,Grok 4,xai/grok-4,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2199,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2200,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2201,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2202,GPT-5 (high),openai/gpt-5,israel_tst_2025_7,israel,proofs,OPC R1 8B,1.0
2203,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2204,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2205,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2206,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2207,o4-mini (high),openai/o4-mini--high,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2208,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2209,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2210,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2211,Grok 4,xai/grok-4,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2212,GPT-5 (high),openai/gpt-5,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2213,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2214,Grok 4,xai/grok-4,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2215,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2216,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2217,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2218,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2219,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2220,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2221,o4-mini (high),openai/o4-mini--high,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2222,GPT-5 (high),openai/gpt-5,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2223,Grok 4,xai/grok-4,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2224,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2225,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_1,izho,proofs,OPC R1 8B,0.0
2226,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2227,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2228,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2229,o4-mini (high),openai/o4-mini--high,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2230,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2231,GPT OSS 120B (high),openai/oss-120b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2232,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2233,GPT-5 (high),openai/gpt-5,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2234,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2235,o4-mini (high),openai/o4-mini--high,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2236,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2237,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_2,izho,proofs,OPC R1 8B,1.0
2238,Grok 4,xai/grok-4,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2239,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_2,izho,proofs,OPC R1 8B,1.0
2240,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2241,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2242,GPT OSS 120B (high),openai/oss-120b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2243,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_3,izho,proofs,OPC R1 8B,1.0
2244,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2245,o4-mini (high),openai/o4-mini--high,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2246,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2247,GPT OSS 120B (high),openai/oss-120b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2248,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_3,izho,proofs,OPC R1 8B,1.0
2249,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2250,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2251,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2252,Grok 4,xai/grok-4,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2253,GPT-5 (high),openai/gpt-5,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2254,Grok 4,xai/grok-4,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2255,GPT OSS 120B (high),openai/oss-120b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2256,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2257,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2258,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2259,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2260,o4-mini (high),openai/o4-mini--high,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2261,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2262,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2263,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2264,o4-mini (high),openai/o4-mini--high,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2265,Grok 4,xai/grok-4,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2266,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2267,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2268,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2269,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2270,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2271,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2272,GPT OSS 120B (high),openai/oss-120b,izho_2025_5,izho,proofs,OPC R1 8B,1.0
2273,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2274,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2275,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2276,o4-mini (high),openai/o4-mini--high,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2277,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2278,Grok 4,xai/grok-4,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2279,GPT OSS 120B (high),openai/oss-120b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2280,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2281,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2282,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2283,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2284,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2285,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2286,Grok 4,xai/grok-4,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2287,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2288,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2289,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2290,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2291,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2292,o4-mini (high),openai/o4-mini--high,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2293,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2294,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2295,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2296,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2297,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2298,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2299,Grok 4,xai/grok-4,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2300,o4-mini (high),openai/o4-mini--high,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2301,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2302,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2303,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2304,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2305,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2306,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2307,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2308,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2309,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2310,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2311,o4-mini (high),openai/o4-mini--high,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2312,Grok 4,xai/grok-4,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2313,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2314,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2315,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2316,Grok 4,xai/grok-4,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2317,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_4,jbmo,proofs,OPC R1 8B,1.0
2318,o4-mini (high),openai/o4-mini--high,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2319,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2320,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2321,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2322,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2323,Grok 4,xai/grok-4,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2324,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2325,GPT-5 (high),openai/gpt-5,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2326,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2327,o4-mini (high),openai/o4-mini--high,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2328,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2329,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2330,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2331,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2332,GPT OSS 120B (high),openai/oss-120b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2333,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2334,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2335,Grok 4,xai/grok-4,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2336,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2337,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2338,GPT OSS 120B (high),openai/oss-120b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2339,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2340,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2341,o4-mini (high),openai/o4-mini--high,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2342,GPT-5 (high),openai/gpt-5,korea_2025_2,korea,proofs,OPC R1 8B,1.0
2343,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2344,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_2,korea,proofs,OPC R1 8B,1.0
2345,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2346,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2347,o4-mini (high),openai/o4-mini--high,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2348,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2349,Grok 4,xai/grok-4,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2350,GPT OSS 120B (high),openai/oss-120b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2351,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2352,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2353,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2354,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2355,GPT-5 (high),openai/gpt-5,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2356,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2357,Grok 4,xai/grok-4,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2358,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2359,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2360,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2361,GPT-5 (high),openai/gpt-5,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2362,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2363,o4-mini (high),openai/o4-mini--high,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2364,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2365,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2366,GPT OSS 120B (high),openai/oss-120b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2367,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_5,korea,proofs,OPC R1 8B,1.0
2368,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2369,GPT OSS 120B (high),openai/oss-120b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2370,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_5,korea,proofs,OPC R1 8B,1.0
2371,GPT-5 (high),openai/gpt-5,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2372,Grok 4,xai/grok-4,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2373,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2374,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2375,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2376,o4-mini (high),openai/o4-mini--high,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2377,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2378,o4-mini (high),openai/o4-mini--high,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2379,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2380,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2381,GPT-5 (high),openai/gpt-5,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2382,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2383,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2384,Grok 4,xai/grok-4,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2385,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2386,GPT OSS 120B (high),openai/oss-120b,korea_2025_6,korea,proofs,OPC R1 8B,1.0
2387,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2391,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2396,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2397,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2399,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,0.0
2403,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,1.0
2408,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,0.0
2411,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,1.0
2415,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,0.0
2417,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,1.0
2420,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2424,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2430,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2432,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,0.0
2435,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,0.0
2440,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,1.0
2442,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2446,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2448,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2451,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2458,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2459,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2464,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2465,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2468,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2475,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2478,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2481,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2483,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,0.0
2488,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,1.0
2489,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,1.0
2499,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2501,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2502,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2505,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2506,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2513,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2518,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,1.0
2524,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,0.0
2525,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,1.0
2528,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2531,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2534,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2539,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2542,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2544,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2550,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2551,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2555,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2563,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2567,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2570,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2571,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2573,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2575,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2582,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2585,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2591,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2593,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2596,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2601,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2605,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,1.0
2607,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,0.0
2611,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,0.0
2616,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2617,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2619,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2629,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2633,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2635,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2638,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,1.0
2643,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,0.0
2646,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,1.0
2650,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2651,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2654,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2663,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2666,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2668,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2669,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2672,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2677,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2681,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,0.0
2683,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,1.0
2684,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,1.0
2694,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2696,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2698,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2702,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,1.0
2708,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,1.0
2710,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,0.0
2717,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2718,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2720,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2724,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2728,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2734,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2736,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2744,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2745,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2748,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,0.0
2752,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,0.0
2755,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,1.0
2757,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,0.0
2758,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,0.0
2766,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,1.0
2770,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_14,matharena,answer,Final Answer Parser,1.0
2772,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_14,matharena,answer,Final Answer Parser,1.0
2782,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,0.0
2784,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,1.0
2785,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,0.0
2792,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,1.0
2793,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,1.0
2796,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,0.0
2800,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2801,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2806,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2808,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2812,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2815,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2819,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2822,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2826,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2836,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2838,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2839,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2846,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2850,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2851,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2853,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,1.0
2857,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,1.0
2861,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,0.0
2863,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,1.0
2868,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,0.0
2872,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,1.0
2878,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2881,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2883,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2890,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2892,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2893,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2900,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2901,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2903,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2908,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2911,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2914,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2920,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,1.0
2923,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,0.0
2927,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,1.0
2928,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,0.0
2935,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,1.0
2936,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,0.0
2940,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,0.0
2941,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,1.0
2944,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,1.0
2950,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2951,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2956,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2962,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,0.0
2970,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,1.0
2971,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,0.0
2973,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2979,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2982,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2983,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2988,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2989,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2995,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,1.0
3002,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,0.0
3004,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,1.0
3008,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
3012,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
3013,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
3016,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
3021,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
3024,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
3027,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
3028,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
3033,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
3039,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
3041,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
3044,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
3045,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
3050,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
3052,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
3056,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
3059,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
3060,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
3065,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
3068,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
3070,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
3071,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
3076,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
3079,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
3081,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
3082,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
3089,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
3090,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,0.0
3092,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
3095,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
3098,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
3102,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
3103,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,0.0
3105,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
3107,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
3108,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
3111,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
3117,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
3121,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,1.0
3122,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
3124,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
3127,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
3130,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
3131,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
3133,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
3140,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,0.0
3142,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,0.0
3143,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,1.0
3145,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,1.0
3148,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
3149,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
3151,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
3153,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,0.0
3158,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
3160,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
3161,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
3166,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
3169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,0.0
3170,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
3173,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
3177,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
3181,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
3184,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
3185,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
3189,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,1.0
3192,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
3197,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
3198,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
3199,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
3207,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
3208,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
3209,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,0.0
3211,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
3214,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
3217,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
3221,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
3223,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
3228,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,1.0
3230,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
3232,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
3233,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
3235,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
3237,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
3238,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
3244,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
3250,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
3252,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,0.0
3253,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
3256,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
3259,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
3261,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
3262,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
3264,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
3266,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
3268,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
3270,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
3274,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,0.0
3276,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
3283,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
3284,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
3285,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
3287,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,1.0
3289,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,0.0
3293,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,1.0
3296,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,0.0
3297,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
3301,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
3303,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
3307,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
3308,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,1.0
3311,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
3312,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
3313,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
3318,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
3319,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
3324,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
3327,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
3329,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
3330,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
3332,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
3335,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
3343,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
3345,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
3346,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
3348,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
3351,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,0.0
3352,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,0.0
3356,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,1.0
3357,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,1.0
3363,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,0.0
3364,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
3365,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
3366,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
3374,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,1.0
3378,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,0.0
3380,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,1.0
3382,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,0.0
3386,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,1.0
3387,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,0.0
3392,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,1.0
3393,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,0.0
3398,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
3399,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
3404,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
3405,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
3407,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
3408,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
3410,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
3412,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,1.0
3418,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
3419,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,1.0
3421,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
3424,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
3429,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,0.0
3431,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
3432,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
3437,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
3441,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
3442,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
3444,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
3447,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
3448,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
3449,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
3450,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
3458,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
3460,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
3462,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
3463,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
3469,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,1.0
3475,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
3478,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
3479,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
3483,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
3484,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
3485,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
3494,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
3496,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
3499,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
3503,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
3507,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
3511,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
3520,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
3522,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
3523,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
3527,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
3529,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
3531,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
3536,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,1.0
3542,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,0.0
3545,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,1.0
3546,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,1.0
3547,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,1.0
3553,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,0.0
3558,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
3560,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
3566,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
3570,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,1.0
3573,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,0.0
3575,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,0.0
3580,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
3581,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
3584,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
3593,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
3595,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
3597,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
3602,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,0.0
3604,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,0.0
3606,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,1.0
3613,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
3616,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
3621,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
3624,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
3627,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
3632,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
3634,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
3639,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
3640,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
3646,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,1.0
3649,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,0.0
3652,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,0.0
3661,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,1.0
3662,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,1.0
3665,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,0.0
3667,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
3675,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
3677,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
3679,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
3683,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
3688,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
3695,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
3697,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
3698,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
3701,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
3708,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
3710,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
3713,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
3714,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
3719,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
3728,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
3730,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
3732,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
3735,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
3736,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
3743,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
3747,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
3748,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
3754,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
3755,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,1.0
3756,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,1.0
3757,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,0.0
3771,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
3772,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
3773,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
3779,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,0.0
3783,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,1.0
3785,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,1.0
3790,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
3791,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
3796,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
3802,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
3805,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
3806,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
3812,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
3819,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
3820,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
3821,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
3824,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
3830,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
3832,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
3835,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
3839,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
3844,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
3851,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
3853,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
3855,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
3856,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
3858,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
3865,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
3866,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
3870,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
3880,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
3883,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
3884,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
3889,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,1.0
3893,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,0.0
3894,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,0.0
3900,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,1.0
3903,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,1.0
3908,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,0.0
3909,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
3910,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
3918,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
3923,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
3926,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
3929,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
3933,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,1.0
3935,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,0.0
3936,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,0.0
3942,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
3944,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
3946,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
3953,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,0.0
3956,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,0.0
3962,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,1.0
3966,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
3970,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
3973,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
3974,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,0.0
3975,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,1.0
3980,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,1.0
3987,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
3988,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
3990,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
3998,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
4003,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
4004,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
4013,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
4015,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
4016,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
4017,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
4019,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
4024,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
4031,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
4032,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
4034,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
4041,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
4042,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
4047,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
4050,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,0.0
4051,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,1.0
4057,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,0.0
4061,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
4068,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
4070,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
4076,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,1.0
4078,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,1.0
4079,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,0.0
4085,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
4086,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
4087,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
4096,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,1.0
4101,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,0.0
4102,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,0.0
4108,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
4109,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
4114,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
4117,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
4123,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
4125,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
4131,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
4132,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
4134,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
4139,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,1.0
4140,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,0.0
4145,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,0.0
4147,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
4148,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
4154,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
4159,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
4161,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
4163,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
4169,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
4170,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
4173,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
4186,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,1.0
4188,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,0.0
4189,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,1.0
4193,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
4197,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
4199,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
4202,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
4203,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
4204,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
4212,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
4213,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
4214,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
4227,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
4229,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
4231,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
4236,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
4238,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
4242,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
4247,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
4248,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
4251,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
4259,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
4261,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
4264,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
4267,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
4268,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
4273,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
4276,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
4277,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
4283,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
4287,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,1.0
4288,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,0.0
4297,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,1.0
4299,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
4301,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
4302,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
4309,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,1.0
4315,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,1.0
4316,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,0.0
4320,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,0.0
4321,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,1.0
4322,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,0.0
4334,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
4335,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
4337,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
4346,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
4347,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
4348,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
4358,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,0.0
4359,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,0.0
4360,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,1.0
4367,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,1.0
4371,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,0.0
4372,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,1.0
4374,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4375,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4376,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4377,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4378,o4-mini (high),openai/o4-mini--high,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4379,GPT OSS 120B (high),openai/oss-120b,nordic_2025_1,nordic,proofs,OPC R1 8B,0.0
4380,GPT-5 (high),openai/gpt-5,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4381,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_1,nordic,proofs,OPC R1 8B,0.0
4382,Grok 4,xai/grok-4,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4383,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4384,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
4385,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4386,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4387,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_2,nordic,proofs,OPC R1 8B,0.0
4388,o4-mini (high),openai/o4-mini--high,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4389,GPT OSS 120B (high),openai/oss-120b,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4390,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4391,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4392,GPT-5 (high),openai/gpt-5,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4393,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_2,nordic,proofs,OPC R1 8B,0.0
4394,Grok 4,xai/grok-4,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4395,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
4396,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
4397,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4398,GPT OSS 120B (high),openai/oss-120b,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
4399,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
4400,o4-mini (high),openai/o4-mini--high,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
4401,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4402,GPT-5 (high),openai/gpt-5,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
4403,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4404,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4405,Grok 4,xai/grok-4,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4406,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
4407,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4408,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4409,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_1,pan,proofs,OPC R1 8B,1.0
4410,Grok 4,xai/grok-4,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4411,GPT-5 (high),openai/gpt-5,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4412,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4413,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4414,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4415,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4416,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4417,o4-mini (high),openai/o4-mini--high,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
4418,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4419,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4420,Grok 4,xai/grok-4,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4421,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4422,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4423,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4424,o4-mini (high),openai/o4-mini--high,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4425,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4426,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4427,GPT-5 (high),openai/gpt-5,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4428,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
4429,GPT-5 (high),openai/gpt-5,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4430,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4431,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_3,pan,proofs,OPC R1 8B,0.0
4432,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4433,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4434,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4435,o4-mini (high),openai/o4-mini--high,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4436,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4437,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4438,Grok 4,xai/grok-4,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4439,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
4440,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4441,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4442,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4443,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4444,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4445,o4-mini (high),openai/o4-mini--high,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4446,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4447,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4448,Grok 4,xai/grok-4,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4449,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4450,GPT-5 (high),openai/gpt-5,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
4451,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4452,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4453,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
4454,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
4455,Grok 4,xai/grok-4,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4456,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4457,GPT-5 (high),openai/gpt-5,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
4458,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
4459,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
4460,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4461,o4-mini (high),openai/o4-mini--high,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
4462,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4463,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
4464,Grok 4,xai/grok-4,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
4465,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4466,o4-mini (high),openai/o4-mini--high,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4467,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4468,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4469,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
4470,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
4471,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
4472,GPT-5 (high),openai/gpt-5,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
4473,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4474,o4-mini (high),openai/o4-mini--high,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4475,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
4476,GPT OSS 120B (high),openai/oss-120b,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
4477,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
4478,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4479,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4480,GPT-5 (high),openai/gpt-5,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4481,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4482,Grok 4,xai/grok-4,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4483,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
4484,GPT-5 (high),openai/gpt-5,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4485,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4486,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4487,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4488,o4-mini (high),openai/o4-mini--high,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4489,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4490,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4491,GPT OSS 120B (high),openai/oss-120b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4492,Grok 4,xai/grok-4,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4493,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4494,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
4495,GPT OSS 120B (high),openai/oss-120b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4496,Grok 4,xai/grok-4,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4497,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4498,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
4499,o4-mini (high),openai/o4-mini--high,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
4500,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
4501,GPT-5 (high),openai/gpt-5,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
4502,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4503,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4504,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
4505,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
4506,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4507,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4508,Grok 4,xai/grok-4,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4509,GPT OSS 120B (high),openai/oss-120b,philippines_2025_4,philippines,proofs,OPC R1 8B,1.0
4510,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4511,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4512,o4-mini (high),openai/o4-mini--high,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4513,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4514,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4515,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4516,GPT-5 (high),openai/gpt-5,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
4517,GPT-5 (high),openai/gpt-5,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4518,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4519,Grok 4,xai/grok-4,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4520,o4-mini (high),openai/o4-mini--high,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
4521,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4522,GPT OSS 120B (high),openai/oss-120b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
4523,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4524,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
4525,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
4526,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
4527,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
4528,GPT-5 (high),openai/gpt-5,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4529,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4530,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4531,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4532,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
4533,Grok 4,xai/grok-4,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4534,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4535,o4-mini (high),openai/o4-mini--high,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
4536,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
4537,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
4538,GPT OSS 120B (high),openai/oss-120b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
4539,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4540,GPT OSS 120B (high),openai/oss-120b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4541,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4542,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4543,o4-mini (high),openai/o4-mini--high,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4544,Grok 4,xai/grok-4,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4545,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4546,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4547,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4548,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
4549,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4550,GPT OSS 120B (high),openai/oss-120b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4551,o4-mini (high),openai/o4-mini--high,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4552,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4553,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4554,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4555,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_8,philippines,proofs,OPC R1 8B,1.0
4556,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4557,Grok 4,xai/grok-4,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
4558,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_8,philippines,proofs,OPC R1 8B,1.0
4559,Grok 4,xai/grok-4,polish_2025_1,polish,proofs,OPC R1 8B,0.0
4560,GPT-5 (high),openai/gpt-5,polish_2025_1,polish,proofs,OPC R1 8B,0.0
4561,GPT OSS 120B (high),openai/oss-120b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4562,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4563,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4564,o4-mini (high),openai/o4-mini--high,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4565,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4566,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4567,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4568,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4569,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_1,polish,proofs,OPC R1 8B,1.0
4570,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
4571,GPT OSS 120B (high),openai/oss-120b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
4572,Grok 4,xai/grok-4,polish_2025_2,polish,proofs,OPC R1 8B,0.0
4573,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4574,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4575,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4576,o4-mini (high),openai/o4-mini--high,polish_2025_2,polish,proofs,OPC R1 8B,0.0
4577,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
4578,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4579,GPT-5 (high),openai/gpt-5,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4580,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_2,polish,proofs,OPC R1 8B,1.0
4581,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4582,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4583,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4584,GPT-5 (high),openai/gpt-5,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4585,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_3,polish,proofs,OPC R1 8B,0.0
4586,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4587,o4-mini (high),openai/o4-mini--high,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4588,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4589,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4590,GPT OSS 120B (high),openai/oss-120b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4591,Grok 4,xai/grok-4,polish_2025_3,polish,proofs,OPC R1 8B,1.0
4592,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4593,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4594,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4595,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4596,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4597,GPT OSS 120B (high),openai/oss-120b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4598,GPT-5 (high),openai/gpt-5,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4599,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4600,Grok 4,xai/grok-4,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4601,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4602,o4-mini (high),openai/o4-mini--high,polish_2025_4,polish,proofs,OPC R1 8B,0.0
4603,Grok 4,xai/grok-4,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4604,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4605,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4606,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4607,GPT-5 (high),openai/gpt-5,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4608,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4609,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4610,o4-mini (high),openai/o4-mini--high,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4611,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4612,GPT OSS 120B (high),openai/oss-120b,polish_2025_5,polish,proofs,OPC R1 8B,1.0
4613,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_5,polish,proofs,OPC R1 8B,0.0
4614,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4615,GPT-5 (high),openai/gpt-5,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4616,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4617,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4618,o4-mini (high),openai/o4-mini--high,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4619,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4620,GPT OSS 120B (high),openai/oss-120b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4621,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4622,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4623,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_6,polish,proofs,OPC R1 8B,1.0
4624,Grok 4,xai/grok-4,polish_2025_6,polish,proofs,OPC R1 8B,0.0
4625,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4626,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4627,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4628,GPT-5 (high),openai/gpt-5,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4629,o4-mini (high),openai/o4-mini--high,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4630,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4631,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4632,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4633,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_1,rmm,proofs,OPC R1 8B,1.0
4634,GPT OSS 120B (high),openai/oss-120b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
4635,Grok 4,xai/grok-4,rmm_2025_1,rmm,proofs,OPC R1 8B,1.0
4636,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4637,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4638,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
4639,GPT OSS 120B (high),openai/oss-120b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4640,GPT-5 (high),openai/gpt-5,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4641,o4-mini (high),openai/o4-mini--high,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
4642,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
4643,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4644,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
4645,Grok 4,xai/grok-4,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
4646,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
4647,o4-mini (high),openai/o4-mini--high,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4648,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4649,GPT-5 (high),openai/gpt-5,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
4650,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4651,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4652,GPT OSS 120B (high),openai/oss-120b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4653,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
4654,Grok 4,xai/grok-4,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
4655,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4656,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4657,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
4658,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4659,Grok 4,xai/grok-4,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4660,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4661,GPT-5 (high),openai/gpt-5,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4662,o4-mini (high),openai/o4-mini--high,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4663,GPT OSS 120B (high),openai/oss-120b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4664,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4665,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4666,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4667,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
4668,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_4,rmm,proofs,OPC R1 8B,1.0
4669,Grok 4,xai/grok-4,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4670,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4671,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4672,GPT OSS 120B (high),openai/oss-120b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4673,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4674,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4675,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4676,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4677,o4-mini (high),openai/o4-mini--high,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4678,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
4679,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4680,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
4681,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
4682,GPT-5 (high),openai/gpt-5,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
4683,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4684,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4685,Grok 4,xai/grok-4,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
4686,GPT OSS 120B (high),openai/oss-120b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4687,o4-mini (high),openai/o4-mini--high,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4688,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4689,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
4690,o4-mini (high),openai/o4-mini--high,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4691,GPT-5 (high),openai/gpt-5,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4692,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4693,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4694,Grok 4,xai/grok-4,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4695,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_1,romania,proofs,OPC R1 8B,1.0
4696,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4697,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4698,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4699,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4700,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
4701,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4702,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
4703,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4704,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4705,o4-mini (high),openai/o4-mini--high,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4706,Grok 4,xai/grok-4,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4707,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
4708,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
4709,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4710,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
4711,GPT-5 (high),openai/gpt-5,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
4712,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4713,GPT-5 (high),openai/gpt-5,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4714,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
4715,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
4716,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4717,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4718,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4719,o4-mini (high),openai/o4-mini--high,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4720,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
4721,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
4722,Grok 4,xai/grok-4,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
4723,GPT-5-mini (high),openai/gpt-5-mini,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4724,Grok 4,xai/grok-4,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
4725,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4726,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4727,o4-mini (high),openai/o4-mini--high,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4728,GPT-5 (high),openai/gpt-5,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4729,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
4730,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4731,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
4732,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
4733,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
4734,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4735,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4736,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
4737,GPT-5-mini (high),openai/gpt-5-mini,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
4738,Grok 4,xai/grok-4,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
4739,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
4740,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4741,o4-mini (high),openai/o4-mini--high,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4742,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4743,GPT-5 (high),openai/gpt-5,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
4744,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
4745,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4747,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4748,o4-mini (high),openai/o4-mini--high,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4749,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4750,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4751,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4752,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4753,Grok 4,xai/grok-4,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4754,GPT-5 (high),openai/gpt-5,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
4755,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4756,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_1,romania,proofs,OPC R1 8B,1.0
4757,o4-mini (high),openai/o4-mini--high,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4758,Grok 4,xai/grok-4,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4759,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4760,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4761,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4762,GPT-5 (high),openai/gpt-5,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4763,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_1,romania,proofs,OPC R1 8B,1.0
4764,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
4765,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4766,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4767,GPT-5-mini (high),openai/gpt-5-mini,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4768,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4769,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4770,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
4771,Grok 4,xai/grok-4,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4772,o4-mini (high),openai/o4-mini--high,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
4773,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
4774,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4775,GPT-5 (high),openai/gpt-5,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
4776,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4777,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_3,romania,proofs,OPC R1 8B,1.0
4778,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4779,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4780,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4781,Grok 4,xai/grok-4,romania_12_2025_3,romania,proofs,OPC R1 8B,1.0
4782,o4-mini (high),openai/o4-mini--high,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4783,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4784,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4785,GPT-5 (high),openai/gpt-5,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
4786,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4787,Grok 4,xai/grok-4,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4788,Qwen3-4B (25/07),qwen/qwen3_4b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4789,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4790,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4791,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4792,o4-mini (high),openai/o4-mini--high,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4793,GPT OSS 120B (high),openai/oss-120b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4794,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
4795,GPT-5 (high),openai/gpt-5,romania_9_2025_1,romania,proofs,OPC R1 8B,1.0
4796,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4797,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4798,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4799,o4-mini (high),openai/o4-mini--high,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4800,GPT-5 (high),openai/gpt-5,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4801,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4802,Qwen3-4B (25/07),qwen/qwen3_4b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4803,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4804,Grok 4,xai/grok-4,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4805,GPT OSS 120B (high),openai/oss-120b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
4806,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4807,GPT-5 (high),openai/gpt-5,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4808,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4809,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4810,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_1,romania,proofs,OPC R1 8B,1.0
4811,Grok 4,xai/grok-4,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4812,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4813,o4-mini (high),openai/o4-mini--high,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4814,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4815,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4816,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
4817,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4818,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
4819,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4820,Grok 4,xai/grok-4,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4821,GPT-5 (high),openai/gpt-5,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
4822,o4-mini (high),openai/o4-mini--high,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4823,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
4824,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4825,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
4826,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4827,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
4828,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4829,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4830,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4831,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4832,GPT-5 (high),openai/gpt-5,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4833,Grok 4,xai/grok-4,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4834,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4835,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4836,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4837,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4838,o4-mini (high),openai/o4-mini--high,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
4839,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4840,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,1.0
4841,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4842,Grok 4,xai/grok-4,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4843,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4844,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4845,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4846,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
4847,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,1.0
4848,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4849,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4850,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4851,Grok 4,xai/grok-4,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4852,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4853,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,1.0
4854,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4855,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4856,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
4857,Grok 4,xai/grok-4,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
4858,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
4859,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
4860,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
4861,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
4862,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
4863,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
4864,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
4865,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
4866,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4867,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4868,Grok 4,xai/grok-4,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4869,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4870,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4871,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4872,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4873,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4874,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
4875,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_1,spain,proofs,OPC R1 8B,0.0
4876,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4877,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4878,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4879,GPT-5 (high),openai/gpt-5,spain_2025_1,spain,proofs,OPC R1 8B,0.0
4880,GPT OSS 120B (high),openai/oss-120b,spain_2025_1,spain,proofs,OPC R1 8B,0.0
4881,o4-mini (high),openai/o4-mini--high,spain_2025_1,spain,proofs,OPC R1 8B,0.0
4882,Grok 4,xai/grok-4,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4883,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4884,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_1,spain,proofs,OPC R1 8B,0.0
4885,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_1,spain,proofs,OPC R1 8B,1.0
4886,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4887,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4888,GPT OSS 120B (high),openai/oss-120b,spain_2025_2,spain,proofs,OPC R1 8B,0.0
4889,o4-mini (high),openai/o4-mini--high,spain_2025_2,spain,proofs,OPC R1 8B,0.0
4890,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_2,spain,proofs,OPC R1 8B,0.0
4891,GPT-5 (high),openai/gpt-5,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4892,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4893,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4894,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4895,Grok 4,xai/grok-4,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4896,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_2,spain,proofs,OPC R1 8B,1.0
4897,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_3,spain,proofs,OPC R1 8B,1.0
4898,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4899,o4-mini (high),openai/o4-mini--high,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4900,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4901,GPT OSS 120B (high),openai/oss-120b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4902,GPT-5 (high),openai/gpt-5,spain_2025_3,spain,proofs,OPC R1 8B,1.0
4903,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4904,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4905,Grok 4,xai/grok-4,spain_2025_3,spain,proofs,OPC R1 8B,0.0
4906,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_3,spain,proofs,OPC R1 8B,1.0
4907,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_4,spain,proofs,OPC R1 8B,1.0
4908,Grok 4,xai/grok-4,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4909,GPT-5 (high),openai/gpt-5,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4910,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4911,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4912,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4913,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4914,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4915,GPT OSS 120B (high),openai/oss-120b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4916,o4-mini (high),openai/o4-mini--high,spain_2025_4,spain,proofs,OPC R1 8B,0.0
4917,GPT-5 (high),openai/gpt-5,spain_2025_5,spain,proofs,OPC R1 8B,1.0
4918,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4919,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4920,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4921,Grok 4,xai/grok-4,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4922,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4923,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4924,o4-mini (high),openai/o4-mini--high,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4925,GPT OSS 120B (high),openai/oss-120b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4926,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4927,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
4928,Grok 4,xai/grok-4,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4929,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4930,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4931,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4932,GPT OSS 120B (high),openai/oss-120b,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4933,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_1,thai,proofs,OPC R1 8B,0.0
4934,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4935,o4-mini (high),openai/o4-mini--high,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4936,GPT-5 (high),openai/gpt-5,thai_2025_1,thai,proofs,OPC R1 8B,1.0
4937,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_1,thai,proofs,OPC R1 8B,0.0
4938,Grok 4,xai/grok-4,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4939,o4-mini (high),openai/o4-mini--high,thai_2025_10,thai,proofs,OPC R1 8B,1.0
4940,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4941,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4942,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4943,GPT OSS 120B (high),openai/oss-120b,thai_2025_10,thai,proofs,OPC R1 8B,1.0
4944,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4945,GPT-5 (high),openai/gpt-5,thai_2025_10,thai,proofs,OPC R1 8B,1.0
4946,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_10,thai,proofs,OPC R1 8B,1.0
4947,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_10,thai,proofs,OPC R1 8B,1.0
4948,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_10,thai,proofs,OPC R1 8B,0.0
4949,GPT OSS 120B (high),openai/oss-120b,thai_2025_2,thai,proofs,OPC R1 8B,0.0
4950,o4-mini (high),openai/o4-mini--high,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4951,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4952,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4953,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4954,GPT-5 (high),openai/gpt-5,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4955,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4956,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4957,Grok 4,xai/grok-4,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4958,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4959,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_2,thai,proofs,OPC R1 8B,1.0
4960,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
4961,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
4962,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_3,thai,proofs,OPC R1 8B,1.0
4963,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_3,thai,proofs,OPC R1 8B,0.0
4964,Grok 4,xai/grok-4,thai_2025_3,thai,proofs,OPC R1 8B,0.0
4965,GPT-5 (high),openai/gpt-5,thai_2025_3,thai,proofs,OPC R1 8B,1.0
4966,GPT OSS 120B (high),openai/oss-120b,thai_2025_3,thai,proofs,OPC R1 8B,1.0
4967,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_3,thai,proofs,OPC R1 8B,1.0
4968,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
4969,o4-mini (high),openai/o4-mini--high,thai_2025_3,thai,proofs,OPC R1 8B,1.0
4970,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_4,thai,proofs,OPC R1 8B,1.0
4971,GPT-5 (high),openai/gpt-5,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4972,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4973,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4974,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4975,GPT OSS 120B (high),openai/oss-120b,thai_2025_4,thai,proofs,OPC R1 8B,1.0
4976,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4977,o4-mini (high),openai/o4-mini--high,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4978,Grok 4,xai/grok-4,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4979,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
4980,GPT-5 (high),openai/gpt-5,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4981,GPT OSS 120B (high),openai/oss-120b,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4982,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4983,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4984,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_5,thai,proofs,OPC R1 8B,0.0
4985,Grok 4,xai/grok-4,thai_2025_5,thai,proofs,OPC R1 8B,0.0
4986,o4-mini (high),openai/o4-mini--high,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4987,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
4988,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_5,thai,proofs,OPC R1 8B,1.0
4989,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
4990,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
4991,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
4992,Grok 4,xai/grok-4,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4993,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4994,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
4995,o4-mini (high),openai/o4-mini--high,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4996,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4997,GPT OSS 120B (high),openai/oss-120b,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4998,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_6,thai,proofs,OPC R1 8B,1.0
4999,GPT-5 (high),openai/gpt-5,thai_2025_6,thai,proofs,OPC R1 8B,1.0
5000,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
5001,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_6,thai,proofs,OPC R1 8B,1.0
5002,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5003,GPT-5 (high),openai/gpt-5,thai_2025_7,thai,proofs,OPC R1 8B,1.0
5004,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5005,o4-mini (high),openai/o4-mini--high,thai_2025_7,thai,proofs,OPC R1 8B,1.0
5006,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_7,thai,proofs,OPC R1 8B,1.0
5007,GPT OSS 120B (high),openai/oss-120b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5008,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5009,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_7,thai,proofs,OPC R1 8B,1.0
5010,Grok 4,xai/grok-4,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5011,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5012,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5013,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5014,GPT OSS 120B (high),openai/oss-120b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5015,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5016,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5017,GPT-5 (high),openai/gpt-5,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5018,o4-mini (high),openai/o4-mini--high,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5019,Grok 4,xai/grok-4,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5020,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5021,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5022,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
5023,o4-mini (high),openai/o4-mini--high,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5024,GPT OSS 120B (high),openai/oss-120b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5025,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5026,GPT-5 (high),openai/gpt-5,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5027,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5028,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5029,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5030,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5031,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_9,thai,proofs,OPC R1 8B,0.0
5032,Grok 4,xai/grok-4,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5033,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5034,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5035,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5036,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
5037,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5038,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5039,GPT-5 (high),openai/gpt-5,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5040,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
5041,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
5042,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5043,Grok 4,xai/grok-4,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5044,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5045,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5046,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5047,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5048,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5049,Grok 4,xai/grok-4,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5050,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,1.0
5051,GPT-5 (high),openai/gpt-5,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,1.0
5052,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5053,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5054,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5055,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
5056,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,1.0
5057,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5058,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5059,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5060,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,1.0
5061,Grok 4,xai/grok-4,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5062,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5063,GPT-5 (high),openai/gpt-5,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5064,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5065,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5066,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5067,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5068,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5069,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5070,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5071,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5072,Grok 4,xai/grok-4,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5073,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5074,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5075,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5076,GPT-5 (high),openai/gpt-5,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5077,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5078,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5079,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5080,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5081,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5082,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5083,GPT-5 (high),openai/gpt-5,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5084,Grok 4,xai/grok-4,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5085,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5086,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5087,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5088,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5089,GPT-5 (high),openai/gpt-5,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5090,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5091,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5092,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5093,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5094,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5095,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5096,Grok 4,xai/grok-4,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5097,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,1.0
5098,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5099,Grok 4,xai/grok-4,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5100,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5101,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5102,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5103,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5104,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5105,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5106,GPT-5 (high),openai/gpt-5,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5107,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5108,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5109,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5110,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5111,Grok 4,xai/grok-4,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5112,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5113,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,1.0
5114,GPT-5 (high),openai/gpt-5,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5115,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5116,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5117,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5118,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5119,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5120,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5121,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5122,Grok 4,xai/grok-4,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5123,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5124,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5125,GPT-5 (high),openai/gpt-5,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5126,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5127,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5128,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,1.0
5129,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5130,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,1.0
5131,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5132,GPT OSS 120B (high),openai/oss-120b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5133,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
5134,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5135,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
5136,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5137,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5138,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5139,Grok 4,xai/grok-4,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5140,o4-mini (high),openai/o4-mini--high,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
5141,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
5142,GPT-5 (high),openai/gpt-5,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
5143,GPT OSS 120B (high),openai/oss-120b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5144,o4-mini (high),openai/o4-mini--high,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5145,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5146,Grok 4,xai/grok-4,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5147,GPT-5 (high),openai/gpt-5,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5148,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5149,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5150,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5151,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5152,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5153,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5154,o4-mini (high),openai/o4-mini--high,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5155,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5156,GPT-5 (high),openai/gpt-5,usamo_2025_3,usamo,proofs,OPC R1 8B,1.0
5157,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5158,GPT OSS 120B (high),openai/oss-120b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5159,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5160,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5161,Grok 4,xai/grok-4,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5162,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5163,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5164,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
5165,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5166,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5167,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5168,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
5169,Grok 4,xai/grok-4,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5170,GPT-5 (high),openai/gpt-5,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5171,GPT OSS 120B (high),openai/oss-120b,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5172,o4-mini (high),openai/o4-mini--high,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5173,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
5174,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
5175,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
5176,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5177,o4-mini (high),openai/o4-mini--high,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5178,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5179,GPT-5 (high),openai/gpt-5,usamo_2025_5,usamo,proofs,OPC R1 8B,1.0
5180,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5181,Grok 4,xai/grok-4,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5182,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5183,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5184,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5185,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5186,GPT OSS 120B (high),openai/oss-120b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5187,GPT OSS 120B (high),openai/oss-120b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5188,GPT-5 (high),openai/gpt-5,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5189,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5190,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5191,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5192,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5193,o4-mini (high),openai/o4-mini--high,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5194,Grok 4,xai/grok-4,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5195,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5196,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5197,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5198,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
5199,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5200,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
5201,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5202,o4-mini (high),openai/o4-mini--high,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
5203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5204,Grok 4,xai/grok-4,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5205,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5206,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
5207,GPT OSS 120B (high),openai/oss-120b,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5208,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5209,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5210,Grok 4,xai/grok-4,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5211,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5212,GPT-5 (high),openai/gpt-5,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5213,GPT OSS 120B (high),openai/oss-120b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5214,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5215,o4-mini (high),openai/o4-mini--high,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5216,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_2,usatst,proofs,OPC R1 8B,1.0
5217,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5218,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5219,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5220,Grok 4,xai/grok-4,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5221,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5222,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_3,usatst,proofs,OPC R1 8B,1.0
5223,o4-mini (high),openai/o4-mini--high,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5224,GPT OSS 120B (high),openai/oss-120b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5225,GPT-5 (high),openai/gpt-5,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5226,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5227,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5228,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5229,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5230,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5231,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5232,o4-mini (high),openai/o4-mini--high,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5233,GPT-5 (high),openai/gpt-5,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5234,Grok 4,xai/grok-4,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5235,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
5236,GPT OSS 120B (high),openai/oss-120b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5237,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
5238,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
5239,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5240,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5241,GPT-5 (high),openai/gpt-5,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5242,o4-mini (high),openai/o4-mini--high,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5243,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5244,GPT OSS 120B (high),openai/oss-120b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5245,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5246,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5247,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5248,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5249,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5250,Grok 4,xai/grok-4,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5251,o4-mini (high),openai/o4-mini--high,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5252,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5253,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5254,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5255,Grok 4,xai/grok-4,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5256,GPT-5 (high),openai/gpt-5,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5257,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5258,GPT OSS 120B (high),openai/oss-120b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5259,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5260,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5261,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
5262,o4-mini (high),openai/o4-mini--high,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5263,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5264,GPT-5 (high),openai/gpt-5,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5265,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5266,GPT OSS 120B (high),openai/oss-120b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5267,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_7,usatst,proofs,OPC R1 8B,1.0
5268,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5269,Grok 4,xai/grok-4,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5270,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5271,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5272,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
5273,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5274,o4-mini (high),openai/o4-mini--high,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5275,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5276,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5277,GPT OSS 120B (high),openai/oss-120b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5278,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5279,GPT-5 (high),openai/gpt-5,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5280,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5281,Grok 4,xai/grok-4,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5282,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5283,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5284,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5285,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5286,GPT-5 (high),openai/gpt-5,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5287,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5288,o4-mini (high),openai/o4-mini--high,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5289,Grok 4,xai/grok-4,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5290,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5291,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5292,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5293,GPT OSS 120B (high),openai/oss-120b,usatst_2025_9,usatst,proofs,OPC R1 8B,1.0
5294,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5295,Grok 4,xai/grok-4,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5296,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5297,GPT-5 (high),openai/gpt-5,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5298,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5299,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5300,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5301,o4-mini (high),openai/o4-mini--high,vietnam_2025_1,vietnam,proofs,OPC R1 8B,0.0
5302,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,0.0
5303,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5304,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5305,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5306,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5307,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5308,Grok 4,xai/grok-4,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5309,o4-mini (high),openai/o4-mini--high,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5310,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5311,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5312,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5313,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5314,GPT-5 (high),openai/gpt-5,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5315,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5316,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
5317,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,1.0
5318,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5319,Grok 4,xai/grok-4,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5320,GPT-5 (high),openai/gpt-5,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5321,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5322,o4-mini (high),openai/o4-mini--high,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5323,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5324,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5325,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5326,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5327,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5328,Grok 4,xai/grok-4,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5329,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5330,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,1.0
5331,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5332,GPT-5 (high),openai/gpt-5,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5333,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5334,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5335,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5336,o4-mini (high),openai/o4-mini--high,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5337,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5338,Grok 4,xai/grok-4,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5339,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5340,o4-mini (high),openai/o4-mini--high,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5341,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5342,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5343,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5344,GPT-5 (high),openai/gpt-5,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5345,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5346,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5347,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_5,vietnam,proofs,OPC R1 8B,1.0
5348,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5349,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,1.0
5350,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5351,GPT-5 (high),openai/gpt-5,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5352,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5353,o4-mini (high),openai/o4-mini--high,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5354,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5355,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5356,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5357,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5358,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5359,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,0.75
5360,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5361,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5362,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
5363,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
5364,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5365,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5366,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5367,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5368,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5369,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5370,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
5371,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5372,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5373,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5374,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5375,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5376,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5377,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5378,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
5379,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.75
5380,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5381,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
5382,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5383,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5384,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5385,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5386,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5387,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5388,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5389,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5390,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5391,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5392,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
5393,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
5394,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5395,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5396,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5397,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5398,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5399,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,0.75
5400,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.5
5401,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5402,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5403,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,0.75
5404,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5405,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,0.75
5406,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5407,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5408,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
5409,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.75
5410,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5411,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
5412,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5413,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5414,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5415,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5416,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5417,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5418,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5419,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5420,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5421,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5422,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
5423,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
5424,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5425,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5426,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5427,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5428,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5429,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5430,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
5431,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5432,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5433,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5434,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5435,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5436,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5437,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5438,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
5439,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
5440,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5441,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
5442,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5443,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5444,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5445,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,0.75
5446,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,0.75
5447,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5448,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5449,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5450,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5451,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5452,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.25
5453,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
5454,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5455,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5456,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5457,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,0.75
5458,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5459,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5460,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.75
5461,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5462,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5463,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5464,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5465,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5466,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5467,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5468,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
5469,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
5470,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5471,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.75
5472,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5473,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5474,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5475,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5476,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5477,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5478,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5479,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5480,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5481,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5482,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
5483,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
5484,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.5
5485,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5486,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5487,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5488,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5489,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5490,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
5491,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5492,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5493,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5494,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5495,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5496,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5497,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5498,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
5499,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
5500,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5501,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
5502,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5503,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5504,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5505,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5506,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5507,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5538,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5539,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5540,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5541,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5542,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
5543,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
5544,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5545,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5546,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5547,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5548,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5549,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5550,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
5551,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5552,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5553,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5554,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5555,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,0.75
5556,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5557,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5558,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
5559,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
5560,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5561,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
5562,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5563,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5564,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5565,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,0.75
5566,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5567,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5568,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5569,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,0.75
5570,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5571,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5572,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.25
5573,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
5574,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5575,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5576,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5577,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5578,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5579,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5580,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.75
5581,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5582,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5583,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5584,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5585,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5586,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5587,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5588,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.25
5589,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.25
5590,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5591,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.0
5592,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5593,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5594,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5595,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5596,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5597,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5598,Grok 4,xai/grok-4,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
5599,Grok 4,xai/grok-4,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
5600,Grok 4,xai/grok-4,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
5601,Grok 4,xai/grok-4,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
5602,Grok 4,xai/grok-4,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
5603,Grok 4,xai/grok-4,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.5
5604,Grok 4,xai/grok-4,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
5605,Grok 4,xai/grok-4,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
5606,Grok 4,xai/grok-4,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
5607,Grok 4,xai/grok-4,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
5608,Grok 4,xai/grok-4,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
5609,Grok 4,xai/grok-4,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
5610,Grok 4,xai/grok-4,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
5611,Grok 4,xai/grok-4,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
5612,Grok 4,xai/grok-4,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
5613,Grok 4,xai/grok-4,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
5614,Grok 4,xai/grok-4,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
5615,Grok 4,xai/grok-4,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
5616,Grok 4,xai/grok-4,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
5617,Grok 4,xai/grok-4,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
5618,Grok 4,xai/grok-4,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.25
5619,Grok 4,xai/grok-4,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
5620,Grok 4,xai/grok-4,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
5621,Grok 4,xai/grok-4,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
5622,Grok 4,xai/grok-4,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
5623,Grok 4,xai/grok-4,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
5624,Grok 4,xai/grok-4,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
5625,Grok 4,xai/grok-4,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
5626,Grok 4,xai/grok-4,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
5627,Grok 4,xai/grok-4,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
5628,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5629,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5630,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5631,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5632,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
5633,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
5634,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
5635,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
5636,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5637,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
5638,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5639,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5640,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.25
5641,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.25
5642,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5643,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
5644,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5645,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,0.75
5646,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5647,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5648,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
5649,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
5650,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5651,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,1.0
5652,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5653,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
5654,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5655,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.25
5656,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.5
5657,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
5658,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5659,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.75
5660,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
5661,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5662,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.5
5663,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
5664,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5665,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
5666,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5667,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
5668,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5669,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5670,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5671,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5672,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,0.5
5673,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,0.75
5674,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.0
5675,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.0
5676,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5677,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,1.0
5678,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,0.5
5679,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5680,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.0
5681,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.5
5682,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5683,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,1.0
5684,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5685,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,0.5
5686,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5687,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5688,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.0
5689,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
5690,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,0.5
5691,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.0
5692,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5693,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.0
5694,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5695,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.0
5696,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.75
5697,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.5
5698,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,0.0
5699,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.0
5700,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.0
5701,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5702,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.0
5703,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.25
5704,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5705,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
5706,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5707,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.5
5708,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,0.5
5709,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5710,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5711,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5712,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
5713,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
5714,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
5715,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
5716,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5717,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
5718,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5719,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5720,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
5721,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
5722,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5723,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
5724,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5725,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
5726,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5727,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5728,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
5729,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
5730,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5731,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.5
5732,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5733,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
5734,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5735,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
5736,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.5
5737,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.75
5738,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5739,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.25
5740,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
5741,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5742,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.75
5743,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
5744,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,0.75
5745,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.5
5746,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5747,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
5748,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5749,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5750,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5751,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5752,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
5753,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
5754,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.75
5755,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
5756,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5757,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.75
5758,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5759,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5760,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.75
5761,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
5762,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5763,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.75
5764,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5765,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
5766,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5767,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5768,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
5769,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,0.75
5770,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5771,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.75
5772,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5773,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
5774,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5775,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
5776,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
5777,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
5778,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5779,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
5780,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.75
5781,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5782,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.75
5783,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
5784,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5785,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.75
5786,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5787,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
5788,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5789,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5790,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5791,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,0.75
5792,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
5793,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
5794,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.5
5795,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
5796,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5797,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
5798,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5799,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5800,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
5801,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.5
5802,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5803,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,1.0
5804,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5805,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
5806,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5807,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5808,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
5809,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
5810,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5811,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.25
5812,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5813,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.75
5814,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5815,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
5816,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.75
5817,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.5
5818,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5819,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
5820,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.5
5821,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5822,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,1.0
5823,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.5
5824,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5825,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.25
5826,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5827,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
5868,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5869,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5870,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5871,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5872,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,0.5
5873,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,0.75
5874,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
5875,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.75
5876,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5877,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.0
5878,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5879,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5880,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.25
5881,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
5882,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
5883,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
5884,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5885,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
5886,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5887,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,0.75
5888,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
5889,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,0.5
5890,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5891,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.0
5892,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5893,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
5894,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5895,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
5896,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
5897,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
5898,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5899,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
5900,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.25
5901,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5902,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.5
5903,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.0
5904,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5905,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
5906,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5907,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.75
5908,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
5909,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
5910,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
5911,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
5912,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
5913,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
5914,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.0
5915,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.75
5916,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
5917,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
5918,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
5919,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
5920,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
5921,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
5922,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,0.75
5923,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.0
5924,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
5925,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
5926,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
5927,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
5928,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
5929,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
5930,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
5931,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.75
5932,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
5933,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.75
5934,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
5935,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.75
5936,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
5937,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
5938,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
5939,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.5
5940,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
5941,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
5942,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.0
5943,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
5944,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
5945,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.5
5946,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
5947,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.75
5948,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
5949,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
5950,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
5951,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
5952,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.5
5953,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.5
5954,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.75
5955,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
5956,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
5957,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
5958,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
5959,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
5960,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.25
5961,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
5962,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
5963,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
5964,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.75
5965,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
5966,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
5967,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
5968,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
5969,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
5970,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,0.75
5971,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.75
5972,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
5973,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
5974,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,0.75
5975,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
5976,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
5977,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
5978,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
5979,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
5980,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
5981,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
5982,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
5983,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.0
5984,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.5
5985,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
5986,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
5987,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.5
5988,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
5989,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
5990,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
5991,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
5992,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
5993,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
5994,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
5995,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
5996,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
5997,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
5998,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
5999,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
6000,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6001,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.75
6002,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6003,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6004,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6005,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6006,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6007,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
6008,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6009,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
6010,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
6011,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
6012,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
6013,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
6014,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
6015,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.75
6016,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.25
6017,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.75
6018,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
6019,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6020,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
6021,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6022,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6023,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6024,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
6025,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
6026,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,0.75
6027,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,0.75
6028,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6029,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
6030,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6031,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
6032,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6033,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,0.75
6034,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6035,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6036,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6037,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,0.75
6038,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6039,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
6040,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
6041,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
6042,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
6043,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
6044,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
6045,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
6046,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.5
6047,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
6048,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.25
6049,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6050,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
6051,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6052,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6053,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6054,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
6055,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
6056,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
6057,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
6058,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6059,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
6060,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6061,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.5
6062,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6063,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6064,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6065,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6066,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6067,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
6068,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6069,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
6070,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
6071,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
6072,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
6073,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
6074,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
6075,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
6076,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.25
6077,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.5
6078,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.5
6079,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6080,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.75
6081,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6082,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6083,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6084,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
6085,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
6086,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
6087,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,0.75
6088,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6089,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
6090,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6091,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
6092,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6093,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6094,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6095,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6096,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6097,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
6128,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6129,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,0.25
6130,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
6131,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
6132,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
6133,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.25
6134,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
6135,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.5
6136,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.5
6137,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.25
6138,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
6139,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6140,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
6141,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6142,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6143,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6144,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.75
6145,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
6146,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
6147,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
6148,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6149,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.0
6150,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6151,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.25
6152,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6153,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6154,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6155,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6156,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6157,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
6158,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6159,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,0.75
6160,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
6161,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,0.25
6162,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.0
6163,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.0
6164,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.25
6165,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.75
6166,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.0
6167,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.75
6168,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
6169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6170,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
6171,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6172,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6173,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6174,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.5
6175,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.0
6176,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,0.75
6177,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
6178,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6179,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.5
6180,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6181,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
6182,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6183,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6184,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6185,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,0.75
6186,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6187,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,0.75
6188,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
6189,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
6190,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
6191,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
6192,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
6193,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
6194,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
6195,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
6196,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
6197,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
6198,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.5
6199,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
6200,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.5
6201,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
6202,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
6203,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
6204,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
6205,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
6206,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
6207,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
6208,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
6209,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.75
6210,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
6211,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.5
6212,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
6213,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
6214,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
6215,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
6216,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
6217,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
6218,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6219,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6220,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6221,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6222,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
6223,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6224,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6225,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6226,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6227,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6228,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6229,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6230,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6231,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6232,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.5
6233,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6234,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6235,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6236,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6237,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
6238,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6239,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6240,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6241,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.5
6242,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6243,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6244,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6245,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
6246,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6247,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6248,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.5
6249,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.75
6250,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6251,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6252,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,0.75
6253,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6254,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6255,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6256,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6257,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6258,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6259,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6260,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6261,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6262,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6263,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.0
6264,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6265,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6266,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
6267,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6268,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6269,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6270,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6271,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6272,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6273,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6274,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6275,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.75
6276,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6277,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6278,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6279,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,0.5
6280,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,0.75
6281,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6282,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6283,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6284,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6285,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.25
6286,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6287,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6288,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6289,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6290,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,1.0
6291,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6292,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6293,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6294,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.25
6295,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6296,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6297,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6298,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
6299,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6300,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6301,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.5
6302,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.75
6303,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6304,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6305,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6306,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6307,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6308,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6309,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6310,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6311,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6312,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6313,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6314,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6315,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6316,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
6317,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6318,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6319,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
6320,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6321,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6322,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6323,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6324,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6325,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6326,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6327,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6328,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.5
6329,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6330,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6331,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6332,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6333,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6334,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6335,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6336,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6337,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6338,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
6339,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6340,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,0.5
6341,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6342,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6343,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
6344,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6345,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6346,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6347,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
6348,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6349,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6350,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6351,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
6352,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6353,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6354,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
6355,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
6356,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6357,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6358,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6359,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,0.75
6360,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6361,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6362,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6363,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6364,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6365,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6366,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6367,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6368,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6369,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
6370,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6371,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6372,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
6373,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6374,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6375,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6376,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6377,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6378,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6379,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6380,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6381,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
6382,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6383,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6384,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6385,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6386,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6387,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6388,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6389,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.5
6390,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6391,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
6392,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6393,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6394,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6395,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6396,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
6397,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6398,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6399,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6400,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
6401,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6402,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6403,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6404,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
6405,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6406,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6407,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
6408,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
6409,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6410,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6411,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6412,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6413,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6414,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6415,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6416,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6417,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6418,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6419,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6420,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6421,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6422,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
6423,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6424,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6425,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
6426,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6427,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6428,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6429,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6430,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6431,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6432,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6433,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6434,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.75
6435,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6436,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6437,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6438,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6439,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6440,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6441,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6442,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6443,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6444,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
6445,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6446,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6447,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6448,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6449,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
6450,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6451,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6452,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6453,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
6454,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6455,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,0.75
6456,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,0.75
6457,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
6458,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6459,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6460,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.75
6461,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
6462,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6463,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6464,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6465,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6466,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6467,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6468,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6469,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6470,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6471,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6472,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,0.75
6473,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6474,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6475,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
6476,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6477,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6478,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.75
6479,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6480,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6481,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6482,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6536,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6537,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6538,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6539,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6540,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.5
6541,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6542,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6543,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6544,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,0.75
6545,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6546,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,0.75
6547,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6548,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6549,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6550,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.5
6551,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6552,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6553,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6554,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6555,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.25
6556,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6557,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6558,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6559,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.5
6560,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6561,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,0.25
6562,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,0.25
6563,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
6564,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6565,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6566,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
6567,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
6568,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,0.75
6569,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6570,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6571,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6572,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6573,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6574,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6575,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6576,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6577,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6578,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6579,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,0.75
6580,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6581,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
6582,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6583,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6584,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.0
6585,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6586,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6587,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6588,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6589,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6590,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6591,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6592,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6593,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.0
6594,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6595,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6596,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6597,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6598,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6599,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,0.5
6600,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6601,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6602,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6603,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.75
6604,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6605,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,0.75
6606,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6607,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6608,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
6609,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6610,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6611,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6612,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.75
6613,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6614,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6615,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6616,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
6617,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6618,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,0.75
6619,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
6620,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.0
6621,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,0.75
6622,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
6623,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6624,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,0.25
6625,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6626,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6627,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6628,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6629,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6630,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6631,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,0.75
6632,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6633,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6634,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.0
6635,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,0.75
6636,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,0.75
6637,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
6638,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6639,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6640,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6641,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,0.75
6642,Grok 4,xai/grok-4,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
6643,Grok 4,xai/grok-4,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
6644,Grok 4,xai/grok-4,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
6645,Grok 4,xai/grok-4,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
6646,Grok 4,xai/grok-4,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
6647,Grok 4,xai/grok-4,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
6648,Grok 4,xai/grok-4,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
6649,Grok 4,xai/grok-4,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
6650,Grok 4,xai/grok-4,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
6651,Grok 4,xai/grok-4,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
6652,Grok 4,xai/grok-4,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
6653,Grok 4,xai/grok-4,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
6654,Grok 4,xai/grok-4,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
6655,Grok 4,xai/grok-4,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
6656,Grok 4,xai/grok-4,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
6657,Grok 4,xai/grok-4,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
6658,Grok 4,xai/grok-4,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
6659,Grok 4,xai/grok-4,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
6660,Grok 4,xai/grok-4,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
6661,Grok 4,xai/grok-4,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
6662,Grok 4,xai/grok-4,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
6663,Grok 4,xai/grok-4,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
6664,Grok 4,xai/grok-4,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
6665,Grok 4,xai/grok-4,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
6666,Grok 4,xai/grok-4,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
6667,Grok 4,xai/grok-4,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
6668,Grok 4,xai/grok-4,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
6669,Grok 4,xai/grok-4,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
6670,Grok 4,xai/grok-4,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
6671,Grok 4,xai/grok-4,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
6672,Grok 4,xai/grok-4,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.75
6673,Grok 4,xai/grok-4,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.25
6674,Grok 4,xai/grok-4,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
6675,Grok 4,xai/grok-4,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,0.75
6676,Grok 4,xai/grok-4,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
6677,Grok 4,xai/grok-4,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
6678,Grok 4,xai/grok-4,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
6679,Grok 4,xai/grok-4,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
6680,Grok 4,xai/grok-4,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
6681,Grok 4,xai/grok-4,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
6682,Grok 4,xai/grok-4,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
6683,Grok 4,xai/grok-4,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
6684,Grok 4,xai/grok-4,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
6685,Grok 4,xai/grok-4,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
6686,Grok 4,xai/grok-4,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
6687,Grok 4,xai/grok-4,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.75
6688,Grok 4,xai/grok-4,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
6689,Grok 4,xai/grok-4,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
6690,Grok 4,xai/grok-4,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.0
6691,Grok 4,xai/grok-4,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
6692,Grok 4,xai/grok-4,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
6693,Grok 4,xai/grok-4,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
6694,Grok 4,xai/grok-4,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
6695,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6696,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6697,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6698,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
6699,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
6700,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6701,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
6702,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6703,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
6704,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6705,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6706,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6707,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6708,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6709,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6710,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6711,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6712,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
6713,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6714,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
6715,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.5
6716,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6717,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6718,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
6719,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6720,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6721,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
6722,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6723,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6724,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6725,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6726,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.5
6727,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6728,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
6729,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6730,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6731,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6732,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6733,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,0.75
6734,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6735,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6736,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,0.75
6737,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
6738,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6739,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
6740,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6741,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6742,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6743,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6744,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,0.75
6745,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.5
6746,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
6747,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6748,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6749,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
6750,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.75
6751,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6752,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6753,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
6754,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6755,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6756,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
6757,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6758,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.75
6759,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6760,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6761,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6762,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6763,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6764,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6765,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6766,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6767,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
6768,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6769,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
6770,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6771,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6772,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,0.75
6773,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6774,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6775,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.5
6776,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
6777,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6778,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6779,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.25
6780,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.25
6781,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,0.75
6782,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6783,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
6784,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6785,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6786,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6787,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6788,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
6789,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
6790,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,0.75
6791,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
6792,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6793,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
6794,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6795,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6796,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6797,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6798,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6799,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6800,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6801,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6802,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
6803,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6804,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
6805,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,1.0
6806,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6807,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6808,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
6809,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6810,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6811,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
6812,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,0.75
6813,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6814,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6815,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6816,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6817,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6818,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
6819,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
6820,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6821,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
6822,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6823,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.5
6824,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6825,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6826,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6827,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6828,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6829,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6830,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6831,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6832,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
6833,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6834,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
6835,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,1.0
6836,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6837,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6838,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
6839,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6840,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6841,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
6842,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6843,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6844,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6875,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6876,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6877,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,0.75
6878,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
6879,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.75
6880,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6881,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.75
6882,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6883,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
6884,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6885,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6886,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6887,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6888,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6889,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,0.75
6890,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,0.75
6891,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,0.75
6892,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.75
6893,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6894,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
6895,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.0
6896,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,0.75
6897,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6898,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
6899,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6900,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6901,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
6902,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6903,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6904,GPT OSS 120B (high),openai/oss-120b,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6905,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6906,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.25
6907,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.75
6908,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.5
6909,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
6910,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6911,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6912,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6913,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6914,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6915,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6916,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6917,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6918,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6919,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
6920,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.25
6921,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6922,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6923,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
6924,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,0.75
6925,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6926,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6927,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6928,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
6929,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6930,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6931,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
6932,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
6933,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6934,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6935,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
6936,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
6937,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
6938,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
6939,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,1.0
6940,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
6941,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
6942,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
6943,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
6944,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
6945,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
6946,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
6947,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
6948,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
6949,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
6950,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
6951,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
6952,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
6953,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
6954,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
6955,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.75
6956,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
6957,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
6958,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.5
6959,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
6960,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
6961,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
6962,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
6963,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
6964,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
