,solver,solver_id,problem,competition,split,judge,accuracy
0,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
1,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_1,allrussian,proofs,OPC R1 8B,1.0
2,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
3,o4-mini (high),openai/o4-mini--high,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
4,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
5,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
6,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
7,GPT-5 (high),openai/gpt-5,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
8,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_1,allrussian,proofs,OPC R1 8B,1.0
9,Grok 4,xai/grok-4,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
10,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
11,Grok 4,xai/grok-4,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
12,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
13,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
14,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
15,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
16,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
17,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
18,o4-mini (high),openai/o4-mini--high,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
19,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
20,GPT-5 (high),openai/gpt-5,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
21,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_10,allrussian,proofs,OPC R1 8B,0.0
22,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
23,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
24,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
25,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
26,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
27,GPT-5 (high),openai/gpt-5,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
28,o4-mini (high),openai/o4-mini--high,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
29,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_11,allrussian,proofs,OPC R1 8B,1.0
30,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
31,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
32,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
33,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
34,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
35,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
36,o4-mini (high),openai/o4-mini--high,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
37,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
38,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
39,Grok 4,xai/grok-4,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
40,GPT-5 (high),openai/gpt-5,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
41,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
42,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
43,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
44,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
45,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
46,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
47,GPT-5 (high),openai/gpt-5,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
48,Grok 4,xai/grok-4,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
49,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
50,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
51,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
52,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
53,o4-mini (high),openai/o4-mini--high,allrussian_2025_13,allrussian,proofs,OPC R1 8B,0.0
54,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
55,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_14,allrussian,proofs,OPC R1 8B,1.0
56,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
57,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
58,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,1.0
59,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
60,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
61,Grok 4,xai/grok-4,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
62,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
63,o4-mini (high),openai/o4-mini--high,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
64,GPT-5 (high),openai/gpt-5,allrussian_2025_14,allrussian,proofs,OPC R1 8B,0.0
65,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
66,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
67,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
68,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
69,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
70,Grok 4,xai/grok-4,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
71,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_15,allrussian,proofs,OPC R1 8B,1.0
72,o4-mini (high),openai/o4-mini--high,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
73,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
74,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
75,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
76,o4-mini (high),openai/o4-mini--high,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
77,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
78,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
79,Grok 4,xai/grok-4,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
80,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
81,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
82,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
83,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_16,allrussian,proofs,OPC R1 8B,1.0
84,GPT-5 (high),openai/gpt-5,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
85,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
86,Grok 4,xai/grok-4,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
87,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
88,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
89,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
90,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
91,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
92,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
93,GPT-5 (high),openai/gpt-5,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
94,o4-mini (high),openai/o4-mini--high,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
95,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
96,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_2,allrussian,proofs,OPC R1 8B,0.0
97,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
98,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
99,Grok 4,xai/grok-4,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
100,o4-mini (high),openai/o4-mini--high,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
101,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
102,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
103,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
104,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
105,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
106,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
107,GPT-5 (high),openai/gpt-5,allrussian_2025_3,allrussian,proofs,OPC R1 8B,0.0
108,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
109,GPT-5 (high),openai/gpt-5,allrussian_2025_4,allrussian,proofs,OPC R1 8B,1.0
110,o4-mini (high),openai/o4-mini--high,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
111,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
112,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
113,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
114,Grok 4,xai/grok-4,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
115,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
116,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
117,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
118,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
119,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
120,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
121,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
122,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
123,GPT-5 (high),openai/gpt-5,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
124,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
125,Grok 4,xai/grok-4,allrussian_2025_5,allrussian,proofs,OPC R1 8B,0.0
126,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
127,o4-mini (high),openai/o4-mini--high,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
128,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
129,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
130,GPT-5 (high),openai/gpt-5,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
131,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
132,o4-mini (high),openai/o4-mini--high,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
133,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
134,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
135,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
136,Grok 4,xai/grok-4,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
137,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
138,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
139,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_6,allrussian,proofs,OPC R1 8B,0.0
140,o4-mini (high),openai/o4-mini--high,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
141,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
142,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
143,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_7,allrussian,proofs,OPC R1 8B,1.0
144,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
145,GPT-5 (high),openai/gpt-5,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
146,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,1.0
147,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
148,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
149,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
150,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
151,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
152,o4-mini (high),openai/o4-mini--high,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
153,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
154,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
155,Grok 4,xai/grok-4,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
156,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,1.0
157,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
158,GPT-5 (high),openai/gpt-5,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
159,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
160,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
161,gemini-2.5-pro,gemini/gemini-pro-2.5,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
162,GPT-5 (high),openai/gpt-5,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
163,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
164,Grok 4,xai/grok-4,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
165,o4-mini (high),openai/o4-mini--high,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
166,Qwen3-4B (25/07),qwen/qwen3_4b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
167,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
168,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
169,GPT-5-mini (high),openai/gpt-5-mini,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
170,GPT OSS 120B (high),openai/oss-120b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,0.0
171,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
172,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
173,GPT OSS 120B (high),openai/oss-120b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
174,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_1,bmo,proofs,OPC R1 8B,1.0
175,o4-mini (high),openai/o4-mini--high,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
176,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
177,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
178,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
179,Grok 4,xai/grok-4,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
180,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_1,bmo,proofs,OPC R1 8B,0.0
181,GPT-5 (high),openai/gpt-5,bmo_2025_1,bmo,proofs,OPC R1 8B,1.0
182,Grok 4,xai/grok-4,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
183,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
184,GPT OSS 120B (high),openai/oss-120b,bmo_2025_2,bmo,proofs,OPC R1 8B,1.0
185,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
186,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
187,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
188,o4-mini (high),openai/o4-mini--high,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
189,GPT-5 (high),openai/gpt-5,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
190,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
191,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
192,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
193,GPT OSS 120B (high),openai/oss-120b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
194,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_3,bmo,proofs,OPC R1 8B,1.0
195,GPT-5 (high),openai/gpt-5,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
196,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
197,o4-mini (high),openai/o4-mini--high,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
198,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_3,bmo,proofs,OPC R1 8B,1.0
199,Grok 4,xai/grok-4,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
200,GPT-5-mini (high),openai/gpt-5-mini,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
201,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
202,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
204,o4-mini (high),openai/o4-mini--high,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
205,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmo_2025_4,bmo,proofs,OPC R1 8B,1.0
206,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
207,Qwen3-4B (25/07),qwen/qwen3_4b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
208,GPT-5 (high),openai/gpt-5,bmo_2025_4,bmo,proofs,OPC R1 8B,1.0
209,gemini-2.5-pro,gemini/gemini-pro-2.5,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
210,Grok 4,xai/grok-4,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
211,GPT-5-mini (high),openai/gpt-5-mini,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
212,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
213,GPT OSS 120B (high),openai/oss-120b,bmo_2025_4,bmo,proofs,OPC R1 8B,0.0
214,GPT-5 (high),openai/gpt-5,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
215,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
216,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
217,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
218,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
219,Grok 4,xai/grok-4,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
220,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
221,GPT-5-mini (high),openai/gpt-5-mini,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
222,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
223,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,0.0
224,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
225,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
226,Grok 4,xai/grok-4,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
227,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
228,GPT-5 (high),openai/gpt-5,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
229,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
230,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
231,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
232,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
233,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
234,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,0.0
235,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
236,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
237,GPT-5 (high),openai/gpt-5,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
238,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
239,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
240,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,1.0
241,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
242,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
243,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
244,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
245,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
246,Grok 4,xai/grok-4,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
247,GPT-5 (high),openai/gpt-5,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
248,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
249,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
250,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
251,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
252,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,1.0
253,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
254,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
255,Grok 4,xai/grok-4,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
256,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
257,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
258,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
259,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
260,GPT-5-mini (high),openai/gpt-5-mini,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,1.0
261,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
262,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
263,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
264,GPT OSS 120B (high),openai/oss-120b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
265,Grok 4,xai/grok-4,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
266,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
267,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
268,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
269,o4-mini (high),openai/o4-mini--high,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
270,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
271,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
272,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,0.0
273,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
274,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
275,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
276,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
277,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
278,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
279,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
280,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
281,Grok 4,xai/grok-4,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,0.0
282,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
283,GPT-5 (high),openai/gpt-5,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
284,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
285,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
286,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
287,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
288,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
289,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
290,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
291,Grok 4,xai/grok-4,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
292,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,0.0
293,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
294,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
295,Grok 4,xai/grok-4,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
296,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
297,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
298,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
299,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
300,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
301,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,0.0
302,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
303,Grok 4,xai/grok-4,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
304,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,1.0
305,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
306,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
307,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
308,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
309,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
310,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
311,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
312,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
313,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
314,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
315,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
316,GPT-5-mini (high),openai/gpt-5-mini,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
317,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
318,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
319,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
320,Grok 4,xai/grok-4,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
321,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
322,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
323,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
324,Grok 4,xai/grok-4,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
325,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,1.0
326,o4-mini (high),openai/o4-mini--high,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
327,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
328,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,1.0
329,GPT OSS 120B (high),openai/oss-120b,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
330,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
331,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
332,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
333,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
334,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
335,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
336,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
337,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
338,Grok 4,xai/grok-4,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
339,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,0.0
340,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
341,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
342,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
343,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
344,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
345,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
346,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
347,Grok 4,xai/grok-4,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,0.0
348,GPT-5 (high),openai/gpt-5,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
349,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
350,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
351,Grok 4,xai/grok-4,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
352,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
353,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
354,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
355,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
356,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
357,GPT-5 (high),openai/gpt-5,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
358,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
359,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,1.0
360,GPT-5 (high),openai/gpt-5,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,1.0
361,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
362,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
363,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
364,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
365,GPT-5-mini (high),openai/gpt-5-mini,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
366,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
367,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
368,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
369,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
370,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
371,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
372,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
373,Grok 4,xai/grok-4,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
374,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
375,GPT-5-mini (high),openai/gpt-5-mini,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
376,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
377,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
378,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
379,GPT-5 (high),openai/gpt-5,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
380,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,0.0
381,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
382,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
383,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
384,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
385,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
386,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
387,Grok 4,xai/grok-4,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
388,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,0.0
389,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,1.0
390,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
391,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
392,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
393,Grok 4,xai/grok-4,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
394,GPT OSS 120B (high),openai/oss-120b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,1.0
395,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
396,o4-mini (high),openai/o4-mini--high,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
397,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
398,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
399,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
400,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
401,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,1.0
402,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
403,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
404,Grok 4,xai/grok-4,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
405,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
406,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
407,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
408,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
409,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
410,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
411,Grok 4,xai/grok-4,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
412,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
413,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
414,GPT-5 (high),openai/gpt-5,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
415,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
416,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
417,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
418,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,1.0
419,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
420,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
421,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
422,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
423,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
424,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
425,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
426,Grok 4,xai/grok-4,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,0.0
427,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
428,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
429,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
430,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
431,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,1.0
432,Grok 4,xai/grok-4,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
433,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
434,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,1.0
435,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
436,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
437,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
438,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,1.0
439,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,1.0
440,Grok 4,xai/grok-4,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
441,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
442,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
443,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
444,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
445,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
446,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
447,GPT-5 (high),openai/gpt-5,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
448,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
449,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
450,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
451,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
452,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
453,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
454,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
455,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
456,Grok 4,xai/grok-4,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,0.0
457,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
458,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
459,o4-mini (high),openai/o4-mini--high,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
460,Qwen3-4B (25/07),qwen/qwen3_4b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
461,GPT OSS 120B (high),openai/oss-120b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
462,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
463,gemini-2.5-pro,gemini/gemini-pro-2.5,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
464,GPT-5-mini (high),openai/gpt-5-mini,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,0.0
465,Grok 4,xai/grok-4,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
466,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
467,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
468,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
469,o4-mini (high),openai/o4-mini--high,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
470,Grok 4,xai/grok-4,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
471,GPT-5 (high),openai/gpt-5,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
472,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
473,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
474,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
475,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
476,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
477,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,0.0
478,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
479,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
480,GPT-5 (high),openai/gpt-5,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
481,Grok 4,xai/grok-4,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
482,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
483,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
484,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
485,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
486,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
487,o4-mini (high),openai/o4-mini--high,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,0.0
488,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,1.0
489,GPT-5 (high),openai/gpt-5,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
490,o4-mini (high),openai/o4-mini--high,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
491,Grok 4,xai/grok-4,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
492,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
493,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
494,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
495,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
496,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
497,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
498,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
499,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
500,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
501,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
502,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
503,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
504,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
505,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
506,o4-mini (high),openai/o4-mini--high,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
507,GPT-5 (high),openai/gpt-5,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
508,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,0.0
509,Grok 4,xai/grok-4,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
510,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
511,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,1.0
512,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
513,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
514,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
515,o4-mini (high),openai/o4-mini--high,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
516,GPT-5 (high),openai/gpt-5,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
517,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
518,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
519,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
520,Grok 4,xai/grok-4,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,0.0
521,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
522,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
523,Grok 4,xai/grok-4,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
524,GPT-5-mini (high),openai/gpt-5-mini,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
525,GPT-5 (high),openai/gpt-5,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
526,gemini-2.5-pro,gemini/gemini-pro-2.5,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
527,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
528,GPT OSS 120B (high),openai/oss-120b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
529,o4-mini (high),openai/o4-mini--high,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
530,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,1.0
531,Qwen3-4B (25/07),qwen/qwen3_4b,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
532,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_1,canada,proofs,OPC R1 8B,0.0
533,GPT-5 (high),openai/gpt-5,canada_2025_1,canada,proofs,OPC R1 8B,0.0
534,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_1,canada,proofs,OPC R1 8B,0.0
535,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
536,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
537,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_1,canada,proofs,OPC R1 8B,0.0
538,o4-mini (high),openai/o4-mini--high,canada_2025_1,canada,proofs,OPC R1 8B,0.0
539,GPT OSS 120B (high),openai/oss-120b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
540,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_1,canada,proofs,OPC R1 8B,0.0
541,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_2,canada,proofs,OPC R1 8B,1.0
542,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_2,canada,proofs,OPC R1 8B,1.0
543,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_2,canada,proofs,OPC R1 8B,1.0
544,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_2,canada,proofs,OPC R1 8B,1.0
545,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
546,GPT-5 (high),openai/gpt-5,canada_2025_2,canada,proofs,OPC R1 8B,1.0
547,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
548,Grok 4,xai/grok-4,canada_2025_2,canada,proofs,OPC R1 8B,0.0
549,o4-mini (high),openai/o4-mini--high,canada_2025_2,canada,proofs,OPC R1 8B,0.0
550,GPT OSS 120B (high),openai/oss-120b,canada_2025_2,canada,proofs,OPC R1 8B,0.0
551,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_3,canada,proofs,OPC R1 8B,0.0
552,o4-mini (high),openai/o4-mini--high,canada_2025_3,canada,proofs,OPC R1 8B,0.0
553,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_3,canada,proofs,OPC R1 8B,0.0
554,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_3,canada,proofs,OPC R1 8B,0.0
555,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
556,Grok 4,xai/grok-4,canada_2025_3,canada,proofs,OPC R1 8B,1.0
557,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_3,canada,proofs,OPC R1 8B,0.0
558,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
559,GPT-5 (high),openai/gpt-5,canada_2025_3,canada,proofs,OPC R1 8B,0.0
560,GPT OSS 120B (high),openai/oss-120b,canada_2025_3,canada,proofs,OPC R1 8B,1.0
561,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
562,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_4,canada,proofs,OPC R1 8B,0.0
563,Grok 4,xai/grok-4,canada_2025_4,canada,proofs,OPC R1 8B,0.0
564,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_4,canada,proofs,OPC R1 8B,0.0
565,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
566,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
567,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_4,canada,proofs,OPC R1 8B,0.0
568,GPT OSS 120B (high),openai/oss-120b,canada_2025_4,canada,proofs,OPC R1 8B,0.0
569,o4-mini (high),openai/o4-mini--high,canada_2025_4,canada,proofs,OPC R1 8B,0.0
570,GPT-5 (high),openai/gpt-5,canada_2025_4,canada,proofs,OPC R1 8B,0.0
571,Qwen3-4B (25/07),qwen/qwen3_4b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
572,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,canada_2025_5,canada,proofs,OPC R1 8B,1.0
573,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
574,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,canada_2025_5,canada,proofs,OPC R1 8B,0.0
575,gemini-2.5-pro,gemini/gemini-pro-2.5,canada_2025_5,canada,proofs,OPC R1 8B,0.0
576,o4-mini (high),openai/o4-mini--high,canada_2025_5,canada,proofs,OPC R1 8B,1.0
577,GPT OSS 120B (high),openai/oss-120b,canada_2025_5,canada,proofs,OPC R1 8B,1.0
578,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,canada_2025_5,canada,proofs,OPC R1 8B,0.0
579,GPT-5 (high),openai/gpt-5,canada_2025_5,canada,proofs,OPC R1 8B,0.0
580,Grok 4,xai/grok-4,canada_2025_5,canada,proofs,OPC R1 8B,0.0
581,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_1,china,proofs,OPC R1 8B,0.0
582,GPT-5-mini (high),openai/gpt-5-mini,china_2025_1,china,proofs,OPC R1 8B,0.0
583,GPT OSS 120B (high),openai/oss-120b,china_2025_1,china,proofs,OPC R1 8B,1.0
584,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_1,china,proofs,OPC R1 8B,0.0
585,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_1,china,proofs,OPC R1 8B,0.0
586,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_1,china,proofs,OPC R1 8B,0.0
587,GPT-5 (high),openai/gpt-5,china_2025_1,china,proofs,OPC R1 8B,1.0
588,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_1,china,proofs,OPC R1 8B,0.0
589,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_1,china,proofs,OPC R1 8B,0.0
590,Grok 4,xai/grok-4,china_2025_1,china,proofs,OPC R1 8B,0.0
591,o4-mini (high),openai/o4-mini--high,china_2025_1,china,proofs,OPC R1 8B,0.0
592,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_2,china,proofs,OPC R1 8B,0.0
593,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_2,china,proofs,OPC R1 8B,0.0
594,GPT OSS 120B (high),openai/oss-120b,china_2025_2,china,proofs,OPC R1 8B,1.0
595,Grok 4,xai/grok-4,china_2025_2,china,proofs,OPC R1 8B,0.0
596,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_2,china,proofs,OPC R1 8B,1.0
597,GPT-5 (high),openai/gpt-5,china_2025_2,china,proofs,OPC R1 8B,0.0
598,o4-mini (high),openai/o4-mini--high,china_2025_2,china,proofs,OPC R1 8B,0.0
599,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_2,china,proofs,OPC R1 8B,0.0
600,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_2,china,proofs,OPC R1 8B,0.0
601,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_2,china,proofs,OPC R1 8B,0.0
602,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_3,china,proofs,OPC R1 8B,0.0
603,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_3,china,proofs,OPC R1 8B,0.0
604,GPT OSS 120B (high),openai/oss-120b,china_2025_3,china,proofs,OPC R1 8B,1.0
605,GPT-5-mini (high),openai/gpt-5-mini,china_2025_3,china,proofs,OPC R1 8B,0.0
606,Grok 4,xai/grok-4,china_2025_3,china,proofs,OPC R1 8B,0.0
607,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_3,china,proofs,OPC R1 8B,0.0
608,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_3,china,proofs,OPC R1 8B,0.0
609,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_3,china,proofs,OPC R1 8B,0.0
610,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_3,china,proofs,OPC R1 8B,1.0
611,o4-mini (high),openai/o4-mini--high,china_2025_3,china,proofs,OPC R1 8B,0.0
612,GPT-5-mini (high),openai/gpt-5-mini,china_2025_5,china,proofs,OPC R1 8B,0.0
613,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_5,china,proofs,OPC R1 8B,0.0
614,o4-mini (high),openai/o4-mini--high,china_2025_5,china,proofs,OPC R1 8B,0.0
615,Grok 4,xai/grok-4,china_2025_5,china,proofs,OPC R1 8B,0.0
616,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_5,china,proofs,OPC R1 8B,0.0
617,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_5,china,proofs,OPC R1 8B,0.0
618,GPT-5 (high),openai/gpt-5,china_2025_5,china,proofs,OPC R1 8B,0.0
619,GPT OSS 120B (high),openai/oss-120b,china_2025_5,china,proofs,OPC R1 8B,0.0
620,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_5,china,proofs,OPC R1 8B,0.0
621,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_5,china,proofs,OPC R1 8B,0.0
622,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_5,china,proofs,OPC R1 8B,0.0
623,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,china_2025_6,china,proofs,OPC R1 8B,0.0
624,GPT-5 (high),openai/gpt-5,china_2025_6,china,proofs,OPC R1 8B,0.0
625,GPT-5-mini (high),openai/gpt-5-mini,china_2025_6,china,proofs,OPC R1 8B,0.0
626,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,china_2025_6,china,proofs,OPC R1 8B,0.0
627,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,china_2025_6,china,proofs,OPC R1 8B,0.0
628,gemini-2.5-pro,gemini/gemini-pro-2.5,china_2025_6,china,proofs,OPC R1 8B,0.0
629,GPT OSS 120B (high),openai/oss-120b,china_2025_6,china,proofs,OPC R1 8B,0.0
630,o4-mini (high),openai/o4-mini--high,china_2025_6,china,proofs,OPC R1 8B,1.0
631,Qwen3-4B (25/07),qwen/qwen3_4b,china_2025_6,china,proofs,OPC R1 8B,0.0
632,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,china_2025_6,china,proofs,OPC R1 8B,0.0
633,o4-mini (high),openai/o4-mini--high,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
634,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
635,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
636,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
637,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_1,chinatst,proofs,OPC R1 8B,1.0
638,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
639,GPT-5 (high),openai/gpt-5,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
640,Grok 4,xai/grok-4,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
641,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
642,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_1,chinatst,proofs,OPC R1 8B,0.0
643,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
644,o4-mini (high),openai/o4-mini--high,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
645,GPT-5 (high),openai/gpt-5,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
646,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
647,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
648,Grok 4,xai/grok-4,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
649,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
650,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
651,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
652,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_10,chinatst,proofs,OPC R1 8B,1.0
653,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
654,o4-mini (high),openai/o4-mini--high,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
655,Grok 4,xai/grok-4,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
656,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
657,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
658,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
659,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
660,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
661,GPT-5 (high),openai/gpt-5,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
662,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
663,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
664,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
665,o4-mini (high),openai/o4-mini--high,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
666,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
667,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
668,GPT-5 (high),openai/gpt-5,chinatst_2025_12,chinatst,proofs,OPC R1 8B,1.0
669,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
670,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
671,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
672,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
673,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
674,Grok 4,xai/grok-4,chinatst_2025_12,chinatst,proofs,OPC R1 8B,1.0
675,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_12,chinatst,proofs,OPC R1 8B,0.0
676,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
677,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
678,GPT-5 (high),openai/gpt-5,chinatst_2025_13,chinatst,proofs,OPC R1 8B,1.0
679,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
680,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
681,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
682,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
683,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
684,Grok 4,xai/grok-4,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
685,o4-mini (high),openai/o4-mini--high,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
686,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
687,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
688,o4-mini (high),openai/o4-mini--high,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
689,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
690,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
691,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
692,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
693,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_14,chinatst,proofs,OPC R1 8B,1.0
694,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
695,Grok 4,xai/grok-4,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
696,GPT-5 (high),openai/gpt-5,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
697,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_14,chinatst,proofs,OPC R1 8B,0.0
698,o4-mini (high),openai/o4-mini--high,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
699,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
700,GPT-5 (high),openai/gpt-5,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
701,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
702,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
703,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
704,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
705,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
706,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
707,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_15,chinatst,proofs,OPC R1 8B,0.0
708,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,1.0
709,o4-mini (high),openai/o4-mini--high,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
710,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
711,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
712,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
713,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
714,Grok 4,xai/grok-4,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
715,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
716,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
717,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
718,GPT-5 (high),openai/gpt-5,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
719,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
720,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
721,Grok 4,xai/grok-4,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
722,GPT-5 (high),openai/gpt-5,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
723,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
724,o4-mini (high),openai/o4-mini--high,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
725,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
726,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
727,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
728,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
729,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_17,chinatst,proofs,OPC R1 8B,1.0
730,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
731,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
732,GPT-5 (high),openai/gpt-5,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
733,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,1.0
734,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
735,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
736,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
737,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
738,o4-mini (high),openai/o4-mini--high,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
739,Grok 4,xai/grok-4,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
740,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
741,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
742,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
743,o4-mini (high),openai/o4-mini--high,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
744,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
745,Grok 4,xai/grok-4,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
747,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
748,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
749,GPT-5 (high),openai/gpt-5,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
750,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
751,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
752,o4-mini (high),openai/o4-mini--high,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
753,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
754,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
755,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,1.0
756,Grok 4,xai/grok-4,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
757,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
758,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
759,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
760,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,1.0
761,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
762,GPT-5 (high),openai/gpt-5,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
763,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
764,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
765,Grok 4,xai/grok-4,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
766,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
767,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
768,GPT-5 (high),openai/gpt-5,chinatst_2025_20,chinatst,proofs,OPC R1 8B,1.0
769,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
770,o4-mini (high),openai/o4-mini--high,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
771,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
772,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
773,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
774,Grok 4,xai/grok-4,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
775,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
776,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
777,GPT-5 (high),openai/gpt-5,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
778,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
779,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
780,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
781,o4-mini (high),openai/o4-mini--high,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
782,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
783,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
784,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_21,chinatst,proofs,OPC R1 8B,0.0
785,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
786,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
787,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
788,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
789,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
790,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
791,o4-mini (high),openai/o4-mini--high,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
792,Grok 4,xai/grok-4,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
793,GPT-5 (high),openai/gpt-5,chinatst_2025_22,chinatst,proofs,OPC R1 8B,1.0
794,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
795,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_22,chinatst,proofs,OPC R1 8B,1.0
796,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
797,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
798,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
799,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
800,GPT-5 (high),openai/gpt-5,chinatst_2025_3,chinatst,proofs,OPC R1 8B,1.0
801,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
802,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
803,o4-mini (high),openai/o4-mini--high,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
804,Grok 4,xai/grok-4,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
805,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
806,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
807,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
808,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
809,Grok 4,xai/grok-4,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
810,o4-mini (high),openai/o4-mini--high,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
811,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
812,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
813,GPT-5 (high),openai/gpt-5,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
814,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
815,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
816,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
817,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_4,chinatst,proofs,OPC R1 8B,0.0
818,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
819,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
820,Grok 4,xai/grok-4,chinatst_2025_5,chinatst,proofs,OPC R1 8B,1.0
821,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_5,chinatst,proofs,OPC R1 8B,1.0
822,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
823,GPT-5 (high),openai/gpt-5,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
824,o4-mini (high),openai/o4-mini--high,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
825,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
826,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
827,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
828,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
829,GPT-5 (high),openai/gpt-5,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
830,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
831,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
832,Grok 4,xai/grok-4,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
833,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
834,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
835,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
836,o4-mini (high),openai/o4-mini--high,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
837,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
838,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
839,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_6,chinatst,proofs,OPC R1 8B,0.0
840,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
841,GPT-5 (high),openai/gpt-5,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
842,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
843,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
844,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
845,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
846,Grok 4,xai/grok-4,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
847,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
848,o4-mini (high),openai/o4-mini--high,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
849,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
850,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_7,chinatst,proofs,OPC R1 8B,0.0
851,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
852,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
853,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
854,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
855,o4-mini (high),openai/o4-mini--high,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
856,GPT-5 (high),openai/gpt-5,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
857,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
858,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
859,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
860,Grok 4,xai/grok-4,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
861,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
862,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
863,Qwen3-4B (25/07),qwen/qwen3_4b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
864,o4-mini (high),openai/o4-mini--high,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
865,GPT-5 (high),openai/gpt-5,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
866,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
867,Grok 4,xai/grok-4,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
868,GPT-5-mini (high),openai/gpt-5-mini,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
869,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
870,GPT OSS 120B (high),openai/oss-120b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
871,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
872,gemini-2.5-pro,gemini/gemini-pro-2.5,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
873,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
874,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
875,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
876,GPT-5 (high),openai/gpt-5,egmo_2025_1,egmo,proofs,OPC R1 8B,1.0
877,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
878,o4-mini (high),openai/o4-mini--high,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
879,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
880,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
881,GPT OSS 120B (high),openai/oss-120b,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
882,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
883,Grok 4,xai/grok-4,egmo_2025_1,egmo,proofs,OPC R1 8B,0.0
884,Grok 4,xai/grok-4,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
885,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
886,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_2,egmo,proofs,OPC R1 8B,1.0
887,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
888,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
889,GPT OSS 120B (high),openai/oss-120b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
890,o4-mini (high),openai/o4-mini--high,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
891,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
892,GPT-5 (high),openai/gpt-5,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
893,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_2,egmo,proofs,OPC R1 8B,1.0
894,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_2,egmo,proofs,OPC R1 8B,0.0
895,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
896,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
897,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
898,GPT-5 (high),openai/gpt-5,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
899,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
900,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
901,o4-mini (high),openai/o4-mini--high,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
902,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
903,GPT OSS 120B (high),openai/oss-120b,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
904,Grok 4,xai/grok-4,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
905,GPT-5 (high),openai/gpt-5,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
906,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
907,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
908,o4-mini (high),openai/o4-mini--high,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
909,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
910,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
911,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
912,GPT OSS 120B (high),openai/oss-120b,egmo_2025_4,egmo,proofs,OPC R1 8B,1.0
913,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
914,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
915,Grok 4,xai/grok-4,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
916,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_5,egmo,proofs,OPC R1 8B,1.0
917,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
918,Grok 4,xai/grok-4,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
919,GPT OSS 120B (high),openai/oss-120b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
920,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
921,GPT-5 (high),openai/gpt-5,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
922,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
923,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
924,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
925,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
926,o4-mini (high),openai/o4-mini--high,egmo_2025_5,egmo,proofs,OPC R1 8B,0.0
927,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
928,gemini-2.5-pro,gemini/gemini-pro-2.5,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
929,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
930,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
931,GPT-5 (high),openai/gpt-5,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
932,o4-mini (high),openai/o4-mini--high,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
933,Grok 4,xai/grok-4,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
934,GPT OSS 120B (high),openai/oss-120b,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
935,GPT-5-mini (high),openai/gpt-5-mini,egmo_2025_6,egmo,proofs,OPC R1 8B,0.0
936,Qwen3-4B (25/07),qwen/qwen3_4b,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
937,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
938,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
939,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
940,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
941,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
942,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
943,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,1.0
944,GPT-5 (high),openai/gpt-5,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
945,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
946,Grok 4,xai/grok-4,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
947,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
948,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
949,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
950,Grok 4,xai/grok-4,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
951,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
952,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
953,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
954,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
955,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,0.0
956,GPT-5 (high),openai/gpt-5,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
957,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
958,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
959,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
960,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
961,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
962,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
963,Grok 4,xai/grok-4,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,1.0
964,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
965,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
966,GPT-5 (high),openai/gpt-5,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,1.0
967,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,0.0
968,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
969,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,1.0
970,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
971,GPT-5 (high),openai/gpt-5,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,1.0
972,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
973,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
974,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
975,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
976,Grok 4,xai/grok-4,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
977,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
978,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,0.0
979,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
980,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
981,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
982,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
983,Grok 4,xai/grok-4,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
984,GPT-5 (high),openai/gpt-5,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
985,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
986,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
987,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
988,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
989,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
990,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
991,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
992,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
993,Grok 4,xai/grok-4,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
994,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
995,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
996,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
997,GPT-5 (high),openai/gpt-5,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
998,o4-mini (high),openai/o4-mini--high,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
999,GPT OSS 120B (high),openai/oss-120b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1000,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1001,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1002,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1003,GPT-5 (high),openai/gpt-5,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1004,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1005,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1006,Grok 4,xai/grok-4,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1007,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
1008,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1009,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1010,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1011,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1012,Grok 4,xai/grok-4,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1013,GPT-5 (high),openai/gpt-5,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,1.0
1014,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1015,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1016,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1017,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
1018,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1019,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1020,Grok 4,xai/grok-4,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1021,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1022,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1023,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1024,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1025,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
1026,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1027,GPT-5 (high),openai/gpt-5,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,1.0
1028,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1029,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1030,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1031,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1032,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1033,GPT-5 (high),openai/gpt-5,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1034,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1035,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1036,Grok 4,xai/grok-4,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,0.0
1037,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
1038,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1039,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1040,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1041,Grok 4,xai/grok-4,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1042,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1043,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1044,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,1.0
1045,GPT-5 (high),openai/gpt-5,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1046,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1047,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
1048,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1049,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1050,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1051,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1052,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1053,Grok 4,xai/grok-4,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,1.0
1054,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1055,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1056,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1057,GPT-5 (high),openai/gpt-5,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
1058,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1059,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1060,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1061,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1062,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,1.0
1063,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1064,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1065,GPT-5 (high),openai/gpt-5,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1066,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1067,Grok 4,xai/grok-4,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
1068,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1069,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1070,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1071,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1072,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1073,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1074,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1075,Grok 4,xai/grok-4,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1076,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
1077,GPT-5 (high),openai/gpt-5,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,1.0
1078,GPT-5 (high),openai/gpt-5,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1079,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,1.0
1080,Grok 4,xai/grok-4,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1081,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1082,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1083,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1084,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1085,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,1.0
1086,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1087,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,0.0
1088,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1089,GPT-5 (high),openai/gpt-5,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1090,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1091,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1092,o4-mini (high),openai/o4-mini--high,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1093,Grok 4,xai/grok-4,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1094,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1095,GPT OSS 120B (high),openai/oss-120b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1096,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1097,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
1098,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1099,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1100,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1101,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1102,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1103,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1104,Grok 4,xai/grok-4,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1105,GPT-5 (high),openai/gpt-5,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
1106,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1107,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,0.0
1108,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1109,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1110,Grok 4,xai/grok-4,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1111,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1112,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1113,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1114,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1115,GPT-5 (high),openai/gpt-5,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1116,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1117,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
1118,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1119,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1120,GPT-5 (high),openai/gpt-5,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1121,Grok 4,xai/grok-4,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1122,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1123,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1124,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,1.0
1125,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,1.0
1126,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1127,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,0.0
1128,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1129,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1130,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1131,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1132,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1133,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1134,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,0.0
1135,Grok 4,xai/grok-4,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1136,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1137,GPT-5 (high),openai/gpt-5,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
1138,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1139,Grok 4,xai/grok-4,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1140,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1141,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1142,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1143,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1144,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1145,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
1146,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1147,GPT-5 (high),openai/gpt-5,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,0.0
1148,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1149,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1150,GPT-5 (high),openai/gpt-5,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1151,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1152,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1153,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1154,Grok 4,xai/grok-4,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1155,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,1.0
1156,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1157,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,0.0
1158,Grok 4,xai/grok-4,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1159,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1160,GPT-5 (high),openai/gpt-5,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1161,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1162,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1163,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1164,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,1.0
1165,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1166,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1167,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
1168,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1169,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1170,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1171,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,1.0
1172,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1173,Grok 4,xai/grok-4,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1174,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1175,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1176,GPT-5 (high),openai/gpt-5,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1177,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
1178,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1179,Grok 4,xai/grok-4,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1180,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1181,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1182,GPT OSS 120B (high),openai/oss-120b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1183,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1184,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1185,GPT-5 (high),openai/gpt-5,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1186,o4-mini (high),openai/o4-mini--high,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1187,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
1188,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1189,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1190,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1191,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1192,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1193,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1194,Grok 4,xai/grok-4,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1195,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1196,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,0.0
1197,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
1198,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1199,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1200,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1201,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,1.0
1202,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,1.0
1204,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1205,Grok 4,xai/grok-4,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1206,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1207,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
1208,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1209,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1210,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1211,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1212,Grok 4,xai/grok-4,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1213,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1214,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1215,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
1216,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1217,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,0.0
1218,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1219,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1220,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1221,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1222,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1223,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1224,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
1225,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1226,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1227,Grok 4,xai/grok-4,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,0.0
1228,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1229,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,1.0
1230,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,1.0
1231,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1232,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1233,Grok 4,xai/grok-4,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1234,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1235,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1236,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1237,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,0.0
1238,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1239,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1240,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1241,Grok 4,xai/grok-4,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1242,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1243,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1244,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1245,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1246,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,1.0
1247,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
1248,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1249,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1250,Grok 4,xai/grok-4,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1251,GPT-5 (high),openai/gpt-5,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1252,Qwen3-4B (25/07),qwen/qwen3_4b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1253,GPT OSS 120B (high),openai/oss-120b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1254,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1255,o4-mini (high),openai/o4-mini--high,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1256,gemini-2.5-pro,gemini/gemini-pro-2.5,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1257,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
1258,o4-mini (high),openai/o4-mini--high,german_2025_1,german,proofs,OPC R1 8B,1.0
1259,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_1,german,proofs,OPC R1 8B,1.0
1260,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_1,german,proofs,OPC R1 8B,1.0
1261,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_1,german,proofs,OPC R1 8B,1.0
1262,Grok 4,xai/grok-4,german_2025_1,german,proofs,OPC R1 8B,1.0
1263,GPT-5 (high),openai/gpt-5,german_2025_1,german,proofs,OPC R1 8B,1.0
1264,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_1,german,proofs,OPC R1 8B,1.0
1265,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_1,german,proofs,OPC R1 8B,1.0
1266,GPT OSS 120B (high),openai/oss-120b,german_2025_1,german,proofs,OPC R1 8B,1.0
1267,GPT-5-mini (high),openai/gpt-5-mini,german_2025_1,german,proofs,OPC R1 8B,1.0
1268,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_1,german,proofs,OPC R1 8B,1.0
1269,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_2,german,proofs,OPC R1 8B,0.0
1270,o4-mini (high),openai/o4-mini--high,german_2025_2,german,proofs,OPC R1 8B,0.0
1271,GPT-5 (high),openai/gpt-5,german_2025_2,german,proofs,OPC R1 8B,0.0
1272,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_2,german,proofs,OPC R1 8B,0.0
1273,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_2,german,proofs,OPC R1 8B,0.0
1274,GPT-5-mini (high),openai/gpt-5-mini,german_2025_2,german,proofs,OPC R1 8B,0.0
1275,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_2,german,proofs,OPC R1 8B,0.0
1276,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_2,german,proofs,OPC R1 8B,0.0
1277,GPT OSS 120B (high),openai/oss-120b,german_2025_2,german,proofs,OPC R1 8B,1.0
1278,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_2,german,proofs,OPC R1 8B,0.0
1279,Grok 4,xai/grok-4,german_2025_2,german,proofs,OPC R1 8B,0.0
1280,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_3,german,proofs,OPC R1 8B,0.0
1281,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_3,german,proofs,OPC R1 8B,1.0
1282,Grok 4,xai/grok-4,german_2025_3,german,proofs,OPC R1 8B,1.0
1283,o4-mini (high),openai/o4-mini--high,german_2025_3,german,proofs,OPC R1 8B,0.0
1284,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_3,german,proofs,OPC R1 8B,0.0
1285,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_3,german,proofs,OPC R1 8B,0.0
1286,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_3,german,proofs,OPC R1 8B,1.0
1287,GPT-5 (high),openai/gpt-5,german_2025_3,german,proofs,OPC R1 8B,1.0
1288,GPT OSS 120B (high),openai/oss-120b,german_2025_3,german,proofs,OPC R1 8B,0.0
1289,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_3,german,proofs,OPC R1 8B,1.0
1290,GPT-5-mini (high),openai/gpt-5-mini,german_2025_3,german,proofs,OPC R1 8B,1.0
1291,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,german_2025_4,german,proofs,OPC R1 8B,1.0
1292,Grok 4,xai/grok-4,german_2025_4,german,proofs,OPC R1 8B,1.0
1293,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,german_2025_4,german,proofs,OPC R1 8B,0.0
1294,gemini-2.5-pro,gemini/gemini-pro-2.5,german_2025_4,german,proofs,OPC R1 8B,0.0
1295,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,german_2025_4,german,proofs,OPC R1 8B,1.0
1296,o4-mini (high),openai/o4-mini--high,german_2025_4,german,proofs,OPC R1 8B,0.0
1297,GPT OSS 120B (high),openai/oss-120b,german_2025_4,german,proofs,OPC R1 8B,0.0
1298,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,german_2025_4,german,proofs,OPC R1 8B,1.0
1299,Qwen3-4B (25/07),qwen/qwen3_4b,german_2025_4,german,proofs,OPC R1 8B,0.0
1300,GPT-5-mini (high),openai/gpt-5-mini,german_2025_4,german,proofs,OPC R1 8B,0.0
1301,GPT-5 (high),openai/gpt-5,german_2025_4,german,proofs,OPC R1 8B,0.0
1302,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1303,GPT-5 (high),openai/gpt-5,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1304,GPT OSS 120B (high),openai/oss-120b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1305,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1306,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1307,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1308,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_1,greece,proofs,OPC R1 8B,0.0
1309,o4-mini (high),openai/o4-mini--high,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1310,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1311,Grok 4,xai/grok-4,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1312,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_1,greece,proofs,OPC R1 8B,1.0
1313,Grok 4,xai/grok-4,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1314,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1315,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1316,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1317,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1318,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1319,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1320,GPT OSS 120B (high),openai/oss-120b,greece_2025_2,greece,proofs,OPC R1 8B,1.0
1321,o4-mini (high),openai/o4-mini--high,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1322,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_2,greece,proofs,OPC R1 8B,0.0
1323,GPT-5 (high),openai/gpt-5,greece_2025_2,greece,proofs,OPC R1 8B,1.0
1324,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1325,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1326,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1327,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1328,GPT OSS 120B (high),openai/oss-120b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1329,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1330,GPT-5 (high),openai/gpt-5,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1331,o4-mini (high),openai/o4-mini--high,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1332,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1333,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_3,greece,proofs,OPC R1 8B,0.0
1334,Grok 4,xai/grok-4,greece_2025_3,greece,proofs,OPC R1 8B,1.0
1335,GPT-5-mini (high),openai/gpt-5-mini,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1336,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1337,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1338,Qwen3-4B (25/07),qwen/qwen3_4b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1339,Grok 4,xai/grok-4,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1340,gemini-2.5-pro,gemini/gemini-pro-2.5,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1341,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,greece_2025_4,greece,proofs,OPC R1 8B,1.0
1342,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1343,GPT-5 (high),openai/gpt-5,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1344,o4-mini (high),openai/o4-mini--high,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1345,GPT OSS 120B (high),openai/oss-120b,greece_2025_4,greece,proofs,OPC R1 8B,0.0
1346,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1347,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1348,o4-mini (high),openai/o4-mini--high,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1349,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1350,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1351,Grok 4,xai/grok-4,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1352,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1353,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1354,GPT OSS 120B (high),openai/oss-120b,imosl_2025_1,imosl,proofs,OPC R1 8B,0.0
1355,GPT-5 (high),openai/gpt-5,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
1356,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1357,o4-mini (high),openai/o4-mini--high,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1358,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1359,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1360,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1361,GPT OSS 120B (high),openai/oss-120b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1362,Grok 4,xai/grok-4,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1363,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1364,GPT-5 (high),openai/gpt-5,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1365,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1366,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
1367,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1368,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1369,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1370,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1371,Grok 4,xai/grok-4,imosl_2025_11,imosl,proofs,OPC R1 8B,1.0
1372,GPT-5 (high),openai/gpt-5,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1373,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1374,GPT OSS 120B (high),openai/oss-120b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1375,o4-mini (high),openai/o4-mini--high,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1376,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1377,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
1378,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1379,GPT OSS 120B (high),openai/oss-120b,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1380,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1381,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1382,GPT-5 (high),openai/gpt-5,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1383,Grok 4,xai/grok-4,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1384,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1385,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1386,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_12,imosl,proofs,OPC R1 8B,0.0
1387,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1388,o4-mini (high),openai/o4-mini--high,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
1389,GPT OSS 120B (high),openai/oss-120b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1390,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1391,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1392,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1393,GPT-5 (high),openai/gpt-5,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1394,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1395,Grok 4,xai/grok-4,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1396,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1397,o4-mini (high),openai/o4-mini--high,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1398,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_13,imosl,proofs,OPC R1 8B,0.0
1399,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1400,GPT-5 (high),openai/gpt-5,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1401,o4-mini (high),openai/o4-mini--high,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1402,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1403,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1404,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1405,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1406,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1407,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1408,GPT OSS 120B (high),openai/oss-120b,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
1409,GPT-5 (high),openai/gpt-5,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1410,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1411,o4-mini (high),openai/o4-mini--high,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1412,GPT OSS 120B (high),openai/oss-120b,imosl_2025_15,imosl,proofs,OPC R1 8B,1.0
1413,Grok 4,xai/grok-4,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1414,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1415,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1416,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1417,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1418,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1419,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
1420,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1421,o4-mini (high),openai/o4-mini--high,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1422,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1423,Grok 4,xai/grok-4,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1424,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1425,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1426,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1427,GPT OSS 120B (high),openai/oss-120b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1428,GPT-5 (high),openai/gpt-5,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1429,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1430,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_16,imosl,proofs,OPC R1 8B,0.0
1431,Grok 4,xai/grok-4,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1432,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1433,o4-mini (high),openai/o4-mini--high,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1434,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1435,GPT-5 (high),openai/gpt-5,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1436,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1437,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1438,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1439,GPT OSS 120B (high),openai/oss-120b,imosl_2025_17,imosl,proofs,OPC R1 8B,1.0
1440,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1441,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_17,imosl,proofs,OPC R1 8B,0.0
1442,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1443,GPT-5 (high),openai/gpt-5,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1444,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1445,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_18,imosl,proofs,OPC R1 8B,1.0
1446,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1447,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1448,GPT OSS 120B (high),openai/oss-120b,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1449,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1450,o4-mini (high),openai/o4-mini--high,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
1451,GPT OSS 120B (high),openai/oss-120b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1452,GPT-5 (high),openai/gpt-5,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1453,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1454,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1455,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1456,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1457,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1458,Grok 4,xai/grok-4,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1459,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1460,o4-mini (high),openai/o4-mini--high,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1461,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
1462,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1463,GPT OSS 120B (high),openai/oss-120b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1464,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1465,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1466,Grok 4,xai/grok-4,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1467,GPT-5 (high),openai/gpt-5,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1468,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1469,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1470,o4-mini (high),openai/o4-mini--high,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1471,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_2,imosl,proofs,OPC R1 8B,0.0
1472,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
1473,GPT-5 (high),openai/gpt-5,imosl_2025_20,imosl,proofs,OPC R1 8B,1.0
1474,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1475,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1476,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1477,GPT OSS 120B (high),openai/oss-120b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1478,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1479,o4-mini (high),openai/o4-mini--high,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1480,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1481,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1482,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
1483,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1484,Grok 4,xai/grok-4,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1485,o4-mini (high),openai/o4-mini--high,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1486,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1487,GPT-5 (high),openai/gpt-5,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1488,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1489,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1490,GPT OSS 120B (high),openai/oss-120b,imosl_2025_21,imosl,proofs,OPC R1 8B,1.0
1491,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1492,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
1493,Grok 4,xai/grok-4,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1494,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1495,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1496,GPT-5 (high),openai/gpt-5,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1497,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1498,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1499,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1500,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1501,GPT OSS 120B (high),openai/oss-120b,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1502,o4-mini (high),openai/o4-mini--high,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1503,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
1504,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1505,Grok 4,xai/grok-4,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1506,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1507,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_23,imosl,proofs,OPC R1 8B,1.0
1508,o4-mini (high),openai/o4-mini--high,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1509,GPT-5 (high),openai/gpt-5,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1510,GPT OSS 120B (high),openai/oss-120b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1511,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1512,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1513,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1514,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
1515,GPT OSS 120B (high),openai/oss-120b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1516,GPT-5 (high),openai/gpt-5,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1517,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1518,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1519,Grok 4,xai/grok-4,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1520,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1521,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1522,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1523,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1524,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1525,o4-mini (high),openai/o4-mini--high,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
1526,GPT OSS 120B (high),openai/oss-120b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1527,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1528,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1529,o4-mini (high),openai/o4-mini--high,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1530,GPT-5 (high),openai/gpt-5,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1531,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1532,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1533,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1534,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
1535,Grok 4,xai/grok-4,imosl_2025_25,imosl,proofs,OPC R1 8B,1.0
1536,GPT OSS 120B (high),openai/oss-120b,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1537,GPT-5 (high),openai/gpt-5,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1538,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1539,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1540,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1541,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1542,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1543,Grok 4,xai/grok-4,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1544,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1545,o4-mini (high),openai/o4-mini--high,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
1546,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_26,imosl,proofs,OPC R1 8B,1.0
1547,GPT-5 (high),openai/gpt-5,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1548,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1549,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1550,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1551,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1552,o4-mini (high),openai/o4-mini--high,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1553,Grok 4,xai/grok-4,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1554,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1555,GPT OSS 120B (high),openai/oss-120b,imosl_2025_27,imosl,proofs,OPC R1 8B,0.0
1556,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_27,imosl,proofs,OPC R1 8B,1.0
1557,Grok 4,xai/grok-4,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1558,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1559,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1560,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1561,GPT-5 (high),openai/gpt-5,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1562,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_28,imosl,proofs,OPC R1 8B,1.0
1563,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1564,GPT OSS 120B (high),openai/oss-120b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1565,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1566,o4-mini (high),openai/o4-mini--high,imosl_2025_28,imosl,proofs,OPC R1 8B,1.0
1567,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
1568,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1569,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1570,Grok 4,xai/grok-4,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1571,GPT-5 (high),openai/gpt-5,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1572,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1573,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1574,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1575,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1576,o4-mini (high),openai/o4-mini--high,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1577,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1578,GPT OSS 120B (high),openai/oss-120b,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
1579,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1580,GPT-5 (high),openai/gpt-5,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1581,GPT OSS 120B (high),openai/oss-120b,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1582,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1583,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1584,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1585,Grok 4,xai/grok-4,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1586,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1587,o4-mini (high),openai/o4-mini--high,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
1588,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1589,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_3,imosl,proofs,OPC R1 8B,0.0
1590,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1591,Grok 4,xai/grok-4,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1592,GPT OSS 120B (high),openai/oss-120b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1593,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1594,GPT-5 (high),openai/gpt-5,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1595,o4-mini (high),openai/o4-mini--high,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1596,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1597,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1598,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1599,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1600,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
1601,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1602,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_31,imosl,proofs,OPC R1 8B,1.0
1603,o4-mini (high),openai/o4-mini--high,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1604,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1605,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_31,imosl,proofs,OPC R1 8B,1.0
1606,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1607,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1608,GPT OSS 120B (high),openai/oss-120b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1609,GPT-5 (high),openai/gpt-5,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1610,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1611,Grok 4,xai/grok-4,imosl_2025_31,imosl,proofs,OPC R1 8B,0.0
1612,GPT OSS 120B (high),openai/oss-120b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1613,o4-mini (high),openai/o4-mini--high,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1614,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1615,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1616,GPT-5 (high),openai/gpt-5,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1617,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1618,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1619,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1620,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1621,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_32,imosl,proofs,OPC R1 8B,0.0
1622,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1623,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1624,Grok 4,xai/grok-4,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1625,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1626,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1627,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1628,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1629,GPT-5 (high),openai/gpt-5,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1630,o4-mini (high),openai/o4-mini--high,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1631,GPT OSS 120B (high),openai/oss-120b,imosl_2025_33,imosl,proofs,OPC R1 8B,1.0
1632,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
1633,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1634,GPT OSS 120B (high),openai/oss-120b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1635,Grok 4,xai/grok-4,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1636,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1637,GPT-5 (high),openai/gpt-5,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1638,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1639,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1640,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1641,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1642,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1643,o4-mini (high),openai/o4-mini--high,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
1644,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1645,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1646,Grok 4,xai/grok-4,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1647,GPT OSS 120B (high),openai/oss-120b,imosl_2025_35,imosl,proofs,OPC R1 8B,1.0
1648,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1649,GPT-5 (high),openai/gpt-5,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1650,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1651,o4-mini (high),openai/o4-mini--high,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1652,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1653,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
1654,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1655,GPT-5 (high),openai/gpt-5,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1656,Grok 4,xai/grok-4,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1657,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1658,GPT OSS 120B (high),openai/oss-120b,imosl_2025_36,imosl,proofs,OPC R1 8B,1.0
1659,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1660,o4-mini (high),openai/o4-mini--high,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1661,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1662,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
1663,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_36,imosl,proofs,OPC R1 8B,1.0
1664,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1665,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1666,o4-mini (high),openai/o4-mini--high,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1667,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1668,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1669,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1670,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1671,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1672,Grok 4,xai/grok-4,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1673,GPT OSS 120B (high),openai/oss-120b,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1674,GPT-5 (high),openai/gpt-5,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
1675,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1676,Grok 4,xai/grok-4,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1677,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1678,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1679,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1680,o4-mini (high),openai/o4-mini--high,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1681,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1682,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1683,GPT OSS 120B (high),openai/oss-120b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1684,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1685,GPT-5 (high),openai/gpt-5,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
1686,o4-mini (high),openai/o4-mini--high,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1687,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1688,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1689,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1690,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1691,GPT-5 (high),openai/gpt-5,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1692,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1693,GPT OSS 120B (high),openai/oss-120b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1694,Grok 4,xai/grok-4,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1695,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
1696,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_5,imosl,proofs,OPC R1 8B,1.0
1697,GPT-5 (high),openai/gpt-5,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1698,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1699,GPT OSS 120B (high),openai/oss-120b,imosl_2025_6,imosl,proofs,OPC R1 8B,1.0
1700,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1701,o4-mini (high),openai/o4-mini--high,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1702,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1703,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1704,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1705,Grok 4,xai/grok-4,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1706,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
1707,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1708,GPT OSS 120B (high),openai/oss-120b,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1709,o4-mini (high),openai/o4-mini--high,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1710,Grok 4,xai/grok-4,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1711,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1712,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1713,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1714,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1715,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_7,imosl,proofs,OPC R1 8B,1.0
1716,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1717,GPT-5 (high),openai/gpt-5,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
1718,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1719,GPT OSS 120B (high),openai/oss-120b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1720,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_8,imosl,proofs,OPC R1 8B,1.0
1721,o4-mini (high),openai/o4-mini--high,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1722,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1723,GPT-5 (high),openai/gpt-5,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1724,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1725,Grok 4,xai/grok-4,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1726,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1727,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1728,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
1729,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1730,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1731,o4-mini (high),openai/o4-mini--high,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1732,gemini-2.5-pro,gemini/gemini-pro-2.5,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1733,GPT OSS 120B (high),openai/oss-120b,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1734,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1735,GPT-5-mini (high),openai/gpt-5-mini,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1736,Qwen3-4B (25/07),qwen/qwen3_4b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1737,Grok 4,xai/grok-4,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1738,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,imosl_2025_9,imosl,proofs,OPC R1 8B,1.0
1739,GPT-5 (high),openai/gpt-5,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
1740,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_1,india,proofs,OPC R1 8B,1.0
1741,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_1,india,proofs,OPC R1 8B,1.0
1742,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_1,india,proofs,OPC R1 8B,0.0
1743,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_1,india,proofs,OPC R1 8B,0.0
1744,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_1,india,proofs,OPC R1 8B,0.0
1745,GPT-5-mini (high),openai/gpt-5-mini,india_2025_1,india,proofs,OPC R1 8B,1.0
1746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_1,india,proofs,OPC R1 8B,1.0
1747,GPT-5 (high),openai/gpt-5,india_2025_1,india,proofs,OPC R1 8B,1.0
1748,o4-mini (high),openai/o4-mini--high,india_2025_1,india,proofs,OPC R1 8B,1.0
1749,GPT OSS 120B (high),openai/oss-120b,india_2025_1,india,proofs,OPC R1 8B,0.0
1750,Grok 4,xai/grok-4,india_2025_1,india,proofs,OPC R1 8B,1.0
1751,o4-mini (high),openai/o4-mini--high,india_2025_2,india,proofs,OPC R1 8B,0.0
1752,GPT-5-mini (high),openai/gpt-5-mini,india_2025_2,india,proofs,OPC R1 8B,0.0
1753,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_2,india,proofs,OPC R1 8B,0.0
1754,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_2,india,proofs,OPC R1 8B,0.0
1755,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_2,india,proofs,OPC R1 8B,0.0
1756,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_2,india,proofs,OPC R1 8B,0.0
1757,GPT-5 (high),openai/gpt-5,india_2025_2,india,proofs,OPC R1 8B,0.0
1758,GPT OSS 120B (high),openai/oss-120b,india_2025_2,india,proofs,OPC R1 8B,0.0
1759,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_2,india,proofs,OPC R1 8B,0.0
1760,Grok 4,xai/grok-4,india_2025_2,india,proofs,OPC R1 8B,0.0
1761,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_2,india,proofs,OPC R1 8B,0.0
1762,GPT-5 (high),openai/gpt-5,india_2025_3,india,proofs,OPC R1 8B,0.0
1763,GPT-5-mini (high),openai/gpt-5-mini,india_2025_3,india,proofs,OPC R1 8B,0.0
1764,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_3,india,proofs,OPC R1 8B,0.0
1765,o4-mini (high),openai/o4-mini--high,india_2025_3,india,proofs,OPC R1 8B,0.0
1766,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_3,india,proofs,OPC R1 8B,0.0
1767,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_3,india,proofs,OPC R1 8B,0.0
1768,GPT OSS 120B (high),openai/oss-120b,india_2025_3,india,proofs,OPC R1 8B,1.0
1769,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_3,india,proofs,OPC R1 8B,0.0
1770,Grok 4,xai/grok-4,india_2025_3,india,proofs,OPC R1 8B,0.0
1771,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_3,india,proofs,OPC R1 8B,0.0
1772,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_3,india,proofs,OPC R1 8B,0.0
1773,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_4,india,proofs,OPC R1 8B,0.0
1774,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_4,india,proofs,OPC R1 8B,0.0
1775,Grok 4,xai/grok-4,india_2025_4,india,proofs,OPC R1 8B,1.0
1776,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_4,india,proofs,OPC R1 8B,0.0
1777,o4-mini (high),openai/o4-mini--high,india_2025_4,india,proofs,OPC R1 8B,0.0
1778,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_4,india,proofs,OPC R1 8B,1.0
1779,GPT-5 (high),openai/gpt-5,india_2025_4,india,proofs,OPC R1 8B,0.0
1780,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_4,india,proofs,OPC R1 8B,1.0
1781,GPT-5-mini (high),openai/gpt-5-mini,india_2025_4,india,proofs,OPC R1 8B,0.0
1782,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_4,india,proofs,OPC R1 8B,1.0
1783,GPT OSS 120B (high),openai/oss-120b,india_2025_4,india,proofs,OPC R1 8B,0.0
1784,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_5,india,proofs,OPC R1 8B,0.0
1785,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_5,india,proofs,OPC R1 8B,0.0
1786,GPT OSS 120B (high),openai/oss-120b,india_2025_5,india,proofs,OPC R1 8B,0.0
1787,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_5,india,proofs,OPC R1 8B,0.0
1788,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_5,india,proofs,OPC R1 8B,0.0
1789,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_5,india,proofs,OPC R1 8B,0.0
1790,Grok 4,xai/grok-4,india_2025_5,india,proofs,OPC R1 8B,0.0
1791,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_5,india,proofs,OPC R1 8B,0.0
1792,o4-mini (high),openai/o4-mini--high,india_2025_5,india,proofs,OPC R1 8B,0.0
1793,GPT-5 (high),openai/gpt-5,india_2025_5,india,proofs,OPC R1 8B,0.0
1794,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_2025_6,india,proofs,OPC R1 8B,0.0
1795,GPT-5 (high),openai/gpt-5,india_2025_6,india,proofs,OPC R1 8B,0.0
1796,o4-mini (high),openai/o4-mini--high,india_2025_6,india,proofs,OPC R1 8B,0.0
1797,GPT-5-mini (high),openai/gpt-5-mini,india_2025_6,india,proofs,OPC R1 8B,0.0
1798,GPT OSS 120B (high),openai/oss-120b,india_2025_6,india,proofs,OPC R1 8B,1.0
1799,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_2025_6,india,proofs,OPC R1 8B,0.0
1800,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_2025_6,india,proofs,OPC R1 8B,0.0
1801,Qwen3-4B (25/07),qwen/qwen3_4b,india_2025_6,india,proofs,OPC R1 8B,0.0
1802,Grok 4,xai/grok-4,india_2025_6,india,proofs,OPC R1 8B,0.0
1803,gemini-2.5-pro,gemini/gemini-pro-2.5,india_2025_6,india,proofs,OPC R1 8B,0.0
1804,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_2025_6,india,proofs,OPC R1 8B,0.0
1805,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1806,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1807,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1808,o4-mini (high),openai/o4-mini--high,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1809,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1810,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1811,Grok 4,xai/grok-4,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1812,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1813,GPT-5 (high),openai/gpt-5,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1814,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_1,india,proofs,OPC R1 8B,0.0
1815,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1816,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1817,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1818,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1819,GPT-5 (high),openai/gpt-5,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1820,Grok 4,xai/grok-4,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1821,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1822,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_10,india,proofs,OPC R1 8B,1.0
1823,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1824,o4-mini (high),openai/o4-mini--high,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1825,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
1826,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1827,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1828,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1829,o4-mini (high),openai/o4-mini--high,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1830,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1831,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1832,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1833,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1834,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1835,GPT-5 (high),openai/gpt-5,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1836,Grok 4,xai/grok-4,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
1837,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1838,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1839,GPT-5 (high),openai/gpt-5,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1840,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1841,o4-mini (high),openai/o4-mini--high,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1842,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1843,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1844,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_12,india,proofs,OPC R1 8B,0.0
1845,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1846,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1847,Grok 4,xai/grok-4,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
1848,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1849,o4-mini (high),openai/o4-mini--high,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1850,GPT-5 (high),openai/gpt-5,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1851,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1852,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1853,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1854,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1855,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1856,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
1857,Grok 4,xai/grok-4,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1858,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_13,india,proofs,OPC R1 8B,0.0
1859,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1860,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1861,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1862,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1863,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1864,Grok 4,xai/grok-4,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1865,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1866,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1867,o4-mini (high),openai/o4-mini--high,india_prep_2025_14,india,proofs,OPC R1 8B,0.0
1868,GPT-5 (high),openai/gpt-5,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1869,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
1870,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1871,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1872,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1873,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1874,o4-mini (high),openai/o4-mini--high,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1875,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1876,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_15,india,proofs,OPC R1 8B,1.0
1877,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1878,Grok 4,xai/grok-4,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1879,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1880,GPT-5 (high),openai/gpt-5,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
1881,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1882,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1883,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1884,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1885,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1886,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1887,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1888,Grok 4,xai/grok-4,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1889,GPT-5 (high),openai/gpt-5,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1890,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_16,india,proofs,OPC R1 8B,0.0
1891,o4-mini (high),openai/o4-mini--high,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
1892,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1893,GPT-5 (high),openai/gpt-5,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1894,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_17,india,proofs,OPC R1 8B,1.0
1895,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1896,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_17,india,proofs,OPC R1 8B,1.0
1897,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1898,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1899,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1900,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1901,o4-mini (high),openai/o4-mini--high,india_prep_2025_17,india,proofs,OPC R1 8B,0.0
1902,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1903,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1904,o4-mini (high),openai/o4-mini--high,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1905,GPT-5 (high),openai/gpt-5,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1906,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1907,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1908,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1909,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1910,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1911,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1912,Grok 4,xai/grok-4,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
1913,GPT-5 (high),openai/gpt-5,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1914,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_19,india,proofs,OPC R1 8B,1.0
1915,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1916,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1917,Grok 4,xai/grok-4,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1918,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1919,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1920,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_19,india,proofs,OPC R1 8B,1.0
1921,o4-mini (high),openai/o4-mini--high,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1922,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1923,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
1924,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_2,india,proofs,OPC R1 8B,1.0
1925,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1926,GPT-5 (high),openai/gpt-5,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1927,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1928,Grok 4,xai/grok-4,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1929,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1930,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1931,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1932,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1933,o4-mini (high),openai/o4-mini--high,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1934,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
1935,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1936,GPT-5 (high),openai/gpt-5,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1937,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1938,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1939,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1940,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1941,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1942,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_20,india,proofs,OPC R1 8B,1.0
1943,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1944,o4-mini (high),openai/o4-mini--high,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1945,Grok 4,xai/grok-4,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
1946,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1947,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1948,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1949,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1950,o4-mini (high),openai/o4-mini--high,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1951,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1952,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1953,GPT-5 (high),openai/gpt-5,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1954,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
1955,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_21,india,proofs,OPC R1 8B,1.0
1956,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1957,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1958,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1959,Grok 4,xai/grok-4,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1960,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1961,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_3,india,proofs,OPC R1 8B,1.0
1962,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1963,GPT-5 (high),openai/gpt-5,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1964,o4-mini (high),openai/o4-mini--high,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1965,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1966,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
1967,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1968,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1969,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1970,Grok 4,xai/grok-4,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1971,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1972,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1973,o4-mini (high),openai/o4-mini--high,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1974,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1975,GPT-5 (high),openai/gpt-5,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1976,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1977,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_4,india,proofs,OPC R1 8B,0.0
1978,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1979,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1980,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1981,Grok 4,xai/grok-4,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1982,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1983,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1984,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1985,GPT-5 (high),openai/gpt-5,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1986,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1987,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1988,o4-mini (high),openai/o4-mini--high,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
1989,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1990,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1991,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1992,o4-mini (high),openai/o4-mini--high,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1993,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1994,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_6,india,proofs,OPC R1 8B,1.0
1995,GPT-5 (high),openai/gpt-5,india_prep_2025_6,india,proofs,OPC R1 8B,1.0
1996,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1997,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1998,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
1999,Grok 4,xai/grok-4,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
2000,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2001,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2002,Grok 4,xai/grok-4,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2003,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2004,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2005,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2006,o4-mini (high),openai/o4-mini--high,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2007,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2008,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2009,GPT-5 (high),openai/gpt-5,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2010,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
2011,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2012,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2013,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2014,GPT-5 (high),openai/gpt-5,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2015,o4-mini (high),openai/o4-mini--high,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2016,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2017,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2018,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2019,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2020,Grok 4,xai/grok-4,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2021,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
2022,GPT-5 (high),openai/gpt-5,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2023,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2024,Qwen3-4B (25/07),qwen/qwen3_4b,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2025,Grok 4,xai/grok-4,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2026,o4-mini (high),openai/o4-mini--high,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2027,gemini-2.5-pro,gemini/gemini-pro-2.5,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2028,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2029,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2030,GPT OSS 120B (high),openai/oss-120b,india_prep_2025_9,india,proofs,OPC R1 8B,0.0
2031,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2032,GPT-5-mini (high),openai/gpt-5-mini,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
2033,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2034,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2035,o4-mini (high),openai/o4-mini--high,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2036,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2037,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2038,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_1,iran,proofs,OPC R1 8B,1.0
2039,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2040,Grok 4,xai/grok-4,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2041,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2042,GPT-5 (high),openai/gpt-5,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
2043,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2044,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2045,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_2,iran,proofs,OPC R1 8B,1.0
2046,o4-mini (high),openai/o4-mini--high,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2047,GPT-5 (high),openai/gpt-5,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2048,Grok 4,xai/grok-4,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2049,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2050,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2051,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2052,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_2,iran,proofs,OPC R1 8B,0.0
2053,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2054,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2055,Grok 4,xai/grok-4,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2056,GPT-5 (high),openai/gpt-5,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2057,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2058,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2059,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2060,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2061,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2062,o4-mini (high),openai/o4-mini--high,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
2063,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2064,o4-mini (high),openai/o4-mini--high,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2065,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2066,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2067,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2068,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2069,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2070,GPT-5 (high),openai/gpt-5,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2071,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2072,Grok 4,xai/grok-4,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
2073,Grok 4,xai/grok-4,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2074,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2075,GPT-5 (high),openai/gpt-5,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2076,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2077,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2078,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2079,o4-mini (high),openai/o4-mini--high,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2080,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2081,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
2082,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_5,iran,proofs,OPC R1 8B,1.0
2083,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2084,Grok 4,xai/grok-4,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2085,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2086,o4-mini (high),openai/o4-mini--high,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2087,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2088,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2089,GPT-5 (high),openai/gpt-5,iran_tst_2025_6,iran,proofs,OPC R1 8B,1.0
2090,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2091,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_6,iran,proofs,OPC R1 8B,1.0
2092,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
2093,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2094,GPT-5 (high),openai/gpt-5,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2095,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2096,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2097,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2098,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
2099,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2100,o4-mini (high),openai/o4-mini--high,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2101,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2102,Grok 4,xai/grok-4,iran_tst_2025_7,iran,proofs,OPC R1 8B,0.0
2103,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_8,iran,proofs,OPC R1 8B,1.0
2104,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2105,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2106,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2107,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2108,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2109,Grok 4,xai/grok-4,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2110,o4-mini (high),openai/o4-mini--high,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2111,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2112,GPT-5 (high),openai/gpt-5,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
2113,o4-mini (high),openai/o4-mini--high,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2114,Qwen3-4B (25/07),qwen/qwen3_4b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2115,GPT OSS 120B (high),openai/oss-120b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2116,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,iran_tst_2025_9,iran,proofs,OPC R1 8B,1.0
2117,Grok 4,xai/grok-4,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2118,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2119,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,iran_tst_2025_9,iran,proofs,OPC R1 8B,1.0
2120,gemini-2.5-pro,gemini/gemini-pro-2.5,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2121,GPT-5 (high),openai/gpt-5,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2122,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,iran_tst_2025_9,iran,proofs,OPC R1 8B,0.0
2123,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_1,israel,proofs,OPC R1 8B,1.0
2124,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2125,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2126,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2127,o4-mini (high),openai/o4-mini--high,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2128,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2129,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2130,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2131,GPT-5 (high),openai/gpt-5,israel_tst_2025_1,israel,proofs,OPC R1 8B,1.0
2132,Grok 4,xai/grok-4,israel_tst_2025_1,israel,proofs,OPC R1 8B,0.0
2133,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2134,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2135,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2136,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2137,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2138,GPT-5 (high),openai/gpt-5,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2139,o4-mini (high),openai/o4-mini--high,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2140,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_10,israel,proofs,OPC R1 8B,1.0
2141,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2142,Grok 4,xai/grok-4,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
2143,Grok 4,xai/grok-4,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2144,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2145,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2146,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2147,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2148,GPT-5 (high),openai/gpt-5,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2149,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2150,o4-mini (high),openai/o4-mini--high,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2151,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2152,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
2153,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2154,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2155,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_3,israel,proofs,OPC R1 8B,1.0
2156,Grok 4,xai/grok-4,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2157,GPT-5 (high),openai/gpt-5,israel_tst_2025_3,israel,proofs,OPC R1 8B,1.0
2158,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2159,o4-mini (high),openai/o4-mini--high,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2160,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2161,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2162,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
2163,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2164,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2165,o4-mini (high),openai/o4-mini--high,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2166,Grok 4,xai/grok-4,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2167,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2168,GPT-5 (high),openai/gpt-5,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2170,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2171,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2172,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
2173,GPT-5 (high),openai/gpt-5,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2174,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2175,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2176,Grok 4,xai/grok-4,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2177,o4-mini (high),openai/o4-mini--high,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2178,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2179,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2180,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_5,israel,proofs,OPC R1 8B,1.0
2181,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2182,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
2183,GPT-5 (high),openai/gpt-5,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2184,Grok 4,xai/grok-4,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2185,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2186,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2187,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2188,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2189,o4-mini (high),openai/o4-mini--high,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2190,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_6,israel,proofs,OPC R1 8B,1.0
2191,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2192,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
2193,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2194,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_7,israel,proofs,OPC R1 8B,1.0
2195,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2196,o4-mini (high),openai/o4-mini--high,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2197,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2198,Grok 4,xai/grok-4,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2199,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2200,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2201,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
2202,GPT-5 (high),openai/gpt-5,israel_tst_2025_7,israel,proofs,OPC R1 8B,1.0
2203,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2204,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2205,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2206,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2207,o4-mini (high),openai/o4-mini--high,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2208,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2209,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2210,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2211,Grok 4,xai/grok-4,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
2212,GPT-5 (high),openai/gpt-5,israel_tst_2025_8,israel,proofs,OPC R1 8B,1.0
2213,Qwen3-4B (25/07),qwen/qwen3_4b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2214,Grok 4,xai/grok-4,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2215,gemini-2.5-pro,gemini/gemini-pro-2.5,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2216,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2217,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2218,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2219,GPT OSS 120B (high),openai/oss-120b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2220,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2221,o4-mini (high),openai/o4-mini--high,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2222,GPT-5 (high),openai/gpt-5,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
2223,Grok 4,xai/grok-4,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2224,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2225,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_1,izho,proofs,OPC R1 8B,0.0
2226,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2227,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2228,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2229,o4-mini (high),openai/o4-mini--high,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2230,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2231,GPT OSS 120B (high),openai/oss-120b,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2232,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2233,GPT-5 (high),openai/gpt-5,izho_2025_1,izho,proofs,OPC R1 8B,1.0
2234,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2235,o4-mini (high),openai/o4-mini--high,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2236,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2237,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_2,izho,proofs,OPC R1 8B,1.0
2238,Grok 4,xai/grok-4,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2239,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_2,izho,proofs,OPC R1 8B,1.0
2240,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2241,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2242,GPT OSS 120B (high),openai/oss-120b,izho_2025_2,izho,proofs,OPC R1 8B,0.0
2243,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_3,izho,proofs,OPC R1 8B,1.0
2244,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2245,o4-mini (high),openai/o4-mini--high,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2246,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2247,GPT OSS 120B (high),openai/oss-120b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2248,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_3,izho,proofs,OPC R1 8B,1.0
2249,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2250,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2251,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2252,Grok 4,xai/grok-4,izho_2025_3,izho,proofs,OPC R1 8B,0.0
2253,GPT-5 (high),openai/gpt-5,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2254,Grok 4,xai/grok-4,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2255,GPT OSS 120B (high),openai/oss-120b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2256,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2257,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2258,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_4,izho,proofs,OPC R1 8B,0.0
2259,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2260,o4-mini (high),openai/o4-mini--high,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2261,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2262,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2263,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_4,izho,proofs,OPC R1 8B,1.0
2264,o4-mini (high),openai/o4-mini--high,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2265,Grok 4,xai/grok-4,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2266,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2267,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2268,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2269,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2270,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2271,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_5,izho,proofs,OPC R1 8B,0.0
2272,GPT OSS 120B (high),openai/oss-120b,izho_2025_5,izho,proofs,OPC R1 8B,1.0
2273,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2274,gemini-2.5-pro,gemini/gemini-pro-2.5,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2275,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2276,o4-mini (high),openai/o4-mini--high,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2277,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2278,Grok 4,xai/grok-4,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2279,GPT OSS 120B (high),openai/oss-120b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2280,GPT-5-mini (high),openai/gpt-5-mini,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2281,Qwen3-4B (25/07),qwen/qwen3_4b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2282,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,izho_2025_6,izho,proofs,OPC R1 8B,0.0
2283,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2284,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2285,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2286,Grok 4,xai/grok-4,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2287,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2288,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2289,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2290,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_1,jbmo,proofs,OPC R1 8B,0.0
2291,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2292,o4-mini (high),openai/o4-mini--high,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
2293,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2294,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2295,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2296,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2297,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2298,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2299,Grok 4,xai/grok-4,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2300,o4-mini (high),openai/o4-mini--high,jbmo_2025_2,jbmo,proofs,OPC R1 8B,1.0
2301,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2302,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
2303,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2304,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2305,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2306,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2307,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2308,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2309,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2310,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2311,o4-mini (high),openai/o4-mini--high,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2312,Grok 4,xai/grok-4,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
2313,GPT OSS 120B (high),openai/oss-120b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2314,GPT-5-mini (high),openai/gpt-5-mini,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2315,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2316,Grok 4,xai/grok-4,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2317,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,jbmo_2025_4,jbmo,proofs,OPC R1 8B,1.0
2318,o4-mini (high),openai/o4-mini--high,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2319,Qwen3-4B (25/07),qwen/qwen3_4b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2320,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2321,gemini-2.5-pro,gemini/gemini-pro-2.5,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2322,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
2323,Grok 4,xai/grok-4,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2324,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2325,GPT-5 (high),openai/gpt-5,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2326,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2327,o4-mini (high),openai/o4-mini--high,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2328,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2329,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2330,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_1,korea,proofs,OPC R1 8B,1.0
2331,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2332,GPT OSS 120B (high),openai/oss-120b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2333,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_1,korea,proofs,OPC R1 8B,0.0
2334,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2335,Grok 4,xai/grok-4,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2336,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2337,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2338,GPT OSS 120B (high),openai/oss-120b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2339,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2340,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2341,o4-mini (high),openai/o4-mini--high,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2342,GPT-5 (high),openai/gpt-5,korea_2025_2,korea,proofs,OPC R1 8B,1.0
2343,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_2,korea,proofs,OPC R1 8B,0.0
2344,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_2,korea,proofs,OPC R1 8B,1.0
2345,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2346,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2347,o4-mini (high),openai/o4-mini--high,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2348,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2349,Grok 4,xai/grok-4,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2350,GPT OSS 120B (high),openai/oss-120b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2351,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2352,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2353,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2354,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2355,GPT-5 (high),openai/gpt-5,korea_2025_3,korea,proofs,OPC R1 8B,0.0
2356,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2357,Grok 4,xai/grok-4,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2358,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2359,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2360,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2361,GPT-5 (high),openai/gpt-5,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2362,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2363,o4-mini (high),openai/o4-mini--high,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2364,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2365,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2366,GPT OSS 120B (high),openai/oss-120b,korea_2025_4,korea,proofs,OPC R1 8B,0.0
2367,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_5,korea,proofs,OPC R1 8B,1.0
2368,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2369,GPT OSS 120B (high),openai/oss-120b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2370,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_5,korea,proofs,OPC R1 8B,1.0
2371,GPT-5 (high),openai/gpt-5,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2372,Grok 4,xai/grok-4,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2373,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2374,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2375,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2376,o4-mini (high),openai/o4-mini--high,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2377,gemini-2.5-pro,gemini/gemini-pro-2.5,korea_2025_5,korea,proofs,OPC R1 8B,0.0
2378,o4-mini (high),openai/o4-mini--high,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2379,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2380,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2381,GPT-5 (high),openai/gpt-5,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2382,Qwen3-4B (25/07),qwen/qwen3_4b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2383,GPT-5-mini (high),openai/gpt-5-mini,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2384,Grok 4,xai/grok-4,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2385,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2386,GPT OSS 120B (high),openai/oss-120b,korea_2025_6,korea,proofs,OPC R1 8B,1.0
2387,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,korea_2025_6,korea,proofs,OPC R1 8B,0.0
2388,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2389,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2390,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
2391,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,0.0
2392,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,1.0
2393,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,0.0
2394,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,1.0
2395,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,0.0
2396,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,1.0
2397,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2398,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2399,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
2400,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,0.0
2401,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,0.0
2402,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,1.0
2403,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2404,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2405,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
2406,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2407,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2408,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,0.0
2409,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2410,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2411,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
2412,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2413,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2414,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
2415,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,0.0
2416,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,1.0
2417,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,1.0
2418,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2419,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2420,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
2421,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2422,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2423,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
2424,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,1.0
2425,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,0.0
2426,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,1.0
2427,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2428,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2429,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
2430,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2431,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2432,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
2433,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2434,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2435,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
2436,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2437,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2438,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
2439,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2440,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2441,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
2442,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2443,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2444,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
2445,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2446,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2447,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
2448,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,1.0
2449,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,0.0
2450,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,0.0
2451,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2452,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2453,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
2454,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2455,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2456,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
2457,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,1.0
2458,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,0.0
2459,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,1.0
2460,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2461,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2462,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
2463,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2464,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2465,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
2466,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2467,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2468,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
2469,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,0.0
2470,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,1.0
2471,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,1.0
2472,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2473,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2474,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
2475,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,1.0
2476,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,1.0
2477,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,0.0
2478,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2479,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2480,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
2481,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2482,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2483,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
2484,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2485,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2486,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
2487,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,0.0
2488,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,0.0
2489,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,1.0
2490,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,0.0
2491,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,0.0
2492,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,1.0
2493,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_14,matharena,answer,Final Answer Parser,1.0
2494,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_14,matharena,answer,Final Answer Parser,1.0
2495,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,0.0
2496,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,1.0
2497,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,0.0
2498,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,1.0
2499,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,1.0
2500,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,0.0
2501,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2502,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2503,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
2504,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2505,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2506,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
2507,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2508,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2509,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
2510,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2511,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2512,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
2513,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2514,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2515,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
2516,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,1.0
2517,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,1.0
2518,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,0.0
2519,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,1.0
2520,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,0.0
2521,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,1.0
2522,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2523,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2524,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
2525,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2526,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2527,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
2528,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2529,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2530,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
2531,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2532,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2533,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
2534,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,1.0
2535,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,0.0
2536,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,1.0
2537,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,0.0
2538,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,1.0
2539,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,0.0
2540,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,0.0
2541,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,1.0
2542,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,1.0
2543,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2544,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2545,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
2546,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,0.0
2547,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,1.0
2548,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,0.0
2549,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2550,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2551,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
2552,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2553,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2554,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
2555,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,1.0
2556,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,0.0
2557,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,1.0
2558,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
2559,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
2560,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
2561,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
2562,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
2563,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
2564,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
2565,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
2566,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
2567,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
2568,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
2569,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
2570,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
2571,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
2572,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
2573,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
2574,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
2575,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
2576,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
2577,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
2578,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
2579,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
2580,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
2581,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
2582,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
2583,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
2584,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
2585,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,0.0
2586,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
2587,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
2588,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
2589,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
2590,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,0.0
2591,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
2592,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
2593,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
2594,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
2595,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
2596,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,1.0
2597,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
2598,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,0.0
2599,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
2600,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
2601,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
2602,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
2603,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,0.0
2604,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,0.0
2605,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,1.0
2606,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,1.0
2607,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
2608,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
2609,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
2610,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,0.0
2611,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
2612,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
2613,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
2614,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
2615,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,0.0
2616,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
2617,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
2618,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,1.0
2619,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
2620,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
2621,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,0.0
2622,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,1.0
2623,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
2624,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
2625,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
2626,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
2627,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
2628,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
2629,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,0.0
2630,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
2631,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
2632,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
2633,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
2634,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
2635,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,1.0
2636,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
2637,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
2638,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,0.0
2639,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
2640,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
2641,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
2642,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
2643,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
2644,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,0.0
2645,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
2646,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
2647,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
2648,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
2649,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
2650,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
2651,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
2652,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
2653,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
2654,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,0.0
2655,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
2656,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
2657,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
2658,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
2659,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,1.0
2660,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,0.0
2661,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,1.0
2662,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,0.0
2663,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
2664,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
2665,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
2666,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
2667,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,1.0
2668,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
2669,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
2670,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,0.0
2671,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
2672,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
2673,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
2674,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
2675,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
2676,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
2677,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
2678,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,0.0
2679,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
2680,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
2681,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
2682,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
2683,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,0.0
2684,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,0.0
2685,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,1.0
2686,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,1.0
2687,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,0.0
2688,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
2689,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
2690,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
2691,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,1.0
2692,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,0.0
2693,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,1.0
2694,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,0.0
2695,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,1.0
2696,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,0.0
2697,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,1.0
2698,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,0.0
2699,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
2700,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
2701,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
2702,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
2703,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
2704,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
2705,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,0.0
2706,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,1.0
2707,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
2708,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,1.0
2709,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
2710,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,0.0
2711,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,0.0
2712,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
2713,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
2714,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
2715,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
2716,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
2717,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
2718,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
2719,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
2720,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
2721,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
2722,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,0.0
2723,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
2724,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
2725,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,0.0
2726,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,1.0
2727,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
2728,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
2729,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
2730,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
2731,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
2732,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
2733,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
2734,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
2735,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
2736,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
2737,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
2738,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
2739,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
2740,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
2741,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,0.0
2742,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
2743,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
2744,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,0.0
2745,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,1.0
2746,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,0.0
2747,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,1.0
2748,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,1.0
2749,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,1.0
2750,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,0.0
2751,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
2752,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
2753,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,0.0
2754,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,1.0
2755,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,0.0
2756,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,0.0
2757,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
2758,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
2759,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,0.0
2760,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
2761,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
2762,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
2763,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,0.0
2764,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,0.0
2765,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,1.0
2766,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
2767,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
2768,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
2769,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
2770,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
2771,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
2772,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
2773,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
2774,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
2775,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,1.0
2776,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,0.0
2777,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,0.0
2778,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,1.0
2779,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,1.0
2780,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,0.0
2781,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
2782,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
2783,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
2784,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
2785,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
2786,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
2787,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
2788,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
2789,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
2790,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
2791,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
2792,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,1.0
2793,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
2794,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
2795,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
2796,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
2797,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
2798,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
2799,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
2800,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
2801,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
2802,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
2803,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
2804,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
2805,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,1.0
2806,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,1.0
2807,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,0.0
2808,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
2809,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
2810,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
2811,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,0.0
2812,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,1.0
2813,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,1.0
2814,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
2815,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
2816,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
2817,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
2818,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
2819,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
2820,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
2821,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
2822,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
2823,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
2824,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
2825,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
2826,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
2827,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
2828,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
2829,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
2830,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
2831,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
2832,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
2833,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
2834,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
2835,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
2836,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
2837,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
2838,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
2839,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
2840,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
2841,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,1.0
2842,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,0.0
2843,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,0.0
2844,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,1.0
2845,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,1.0
2846,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,0.0
2847,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
2848,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
2849,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,0.0
2850,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
2851,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
2852,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
2853,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,1.0
2854,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,0.0
2855,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,0.0
2856,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
2857,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
2858,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
2859,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,0.0
2860,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,0.0
2861,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,1.0
2862,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
2863,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
2864,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
2865,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,0.0
2866,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,1.0
2867,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,1.0
2868,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
2869,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
2870,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
2871,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
2872,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
2873,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
2874,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
2875,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
2876,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,0.0
2877,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
2878,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
2879,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
2880,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
2881,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
2882,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
2883,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
2884,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
2885,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
2886,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,0.0
2887,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,1.0
2888,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,0.0
2889,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
2890,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
2891,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
2892,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,1.0
2893,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,1.0
2894,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,0.0
2895,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
2896,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
2897,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
2898,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,1.0
2899,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,0.0
2900,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,0.0
2901,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
2902,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
2903,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
2904,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
2905,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
2906,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
2907,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
2908,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
2909,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
2910,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,1.0
2911,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,0.0
2912,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,0.0
2913,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
2914,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
2915,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
2916,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
2917,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
2918,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
2919,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
2920,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
2921,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
2922,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,1.0
2923,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,0.0
2924,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,1.0
2925,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
2926,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
2927,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
2928,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
2929,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
2930,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,0.0
2931,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
2932,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
2933,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
2934,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
2935,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
2936,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
2937,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
2938,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
2939,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
2940,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
2941,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
2942,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
2943,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
2944,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
2945,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
2946,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
2947,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
2948,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
2949,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
2950,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
2951,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
2952,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,1.0
2953,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,0.0
2954,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,1.0
2955,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
2956,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
2957,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
2958,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,1.0
2959,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,1.0
2960,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,0.0
2961,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,0.0
2962,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,1.0
2963,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,0.0
2964,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
2965,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
2966,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
2967,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
2968,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
2969,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
2970,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,0.0
2971,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,0.0
2972,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,1.0
2973,Qwen3-4B (25/07),qwen/qwen3_4b,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,1.0
2974,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,0.0
2975,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,1.0
2976,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2977,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2978,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2979,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2980,o4-mini (high),openai/o4-mini--high,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2981,GPT OSS 120B (high),openai/oss-120b,nordic_2025_1,nordic,proofs,OPC R1 8B,0.0
2982,GPT-5 (high),openai/gpt-5,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2983,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_1,nordic,proofs,OPC R1 8B,0.0
2984,Grok 4,xai/grok-4,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2985,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2986,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
2987,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2988,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2989,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_2,nordic,proofs,OPC R1 8B,0.0
2990,o4-mini (high),openai/o4-mini--high,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2991,GPT OSS 120B (high),openai/oss-120b,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2992,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2993,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2994,GPT-5 (high),openai/gpt-5,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2995,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_2,nordic,proofs,OPC R1 8B,0.0
2996,Grok 4,xai/grok-4,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2997,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
2998,gemini-2.5-pro,gemini/gemini-pro-2.5,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
2999,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3000,GPT OSS 120B (high),openai/oss-120b,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
3001,GPT-5-mini (high),openai/gpt-5-mini,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
3002,o4-mini (high),openai/o4-mini--high,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
3003,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3004,GPT-5 (high),openai/gpt-5,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
3005,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3006,Qwen3-4B (25/07),qwen/qwen3_4b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3007,Grok 4,xai/grok-4,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3008,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,nordic_2025_3,nordic,proofs,OPC R1 8B,0.0
3009,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3010,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3011,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_1,pan,proofs,OPC R1 8B,1.0
3012,Grok 4,xai/grok-4,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3013,GPT-5 (high),openai/gpt-5,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3014,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3015,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3016,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3017,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3018,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3019,o4-mini (high),openai/o4-mini--high,pan_african_2025_1,pan,proofs,OPC R1 8B,0.0
3020,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3021,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3022,Grok 4,xai/grok-4,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3023,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3024,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3025,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3026,o4-mini (high),openai/o4-mini--high,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3027,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3028,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3029,GPT-5 (high),openai/gpt-5,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3030,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
3031,GPT-5 (high),openai/gpt-5,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3032,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3033,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_3,pan,proofs,OPC R1 8B,0.0
3034,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3035,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3036,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3037,o4-mini (high),openai/o4-mini--high,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3038,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3039,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3040,Grok 4,xai/grok-4,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3041,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
3042,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3043,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3044,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3045,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3046,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3047,o4-mini (high),openai/o4-mini--high,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3048,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3049,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3050,Grok 4,xai/grok-4,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3051,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3052,GPT-5 (high),openai/gpt-5,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
3053,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3054,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3055,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
3056,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
3057,Grok 4,xai/grok-4,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3058,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3059,GPT-5 (high),openai/gpt-5,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
3060,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
3061,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
3062,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3063,o4-mini (high),openai/o4-mini--high,pan_african_2025_5,pan,proofs,OPC R1 8B,0.0
3064,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3065,gemini-2.5-pro,gemini/gemini-pro-2.5,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
3066,Grok 4,xai/grok-4,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
3067,Qwen3-4B (25/07),qwen/qwen3_4b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3068,o4-mini (high),openai/o4-mini--high,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3069,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3070,GPT OSS 120B (high),openai/oss-120b,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3071,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
3072,GPT-5-mini (high),openai/gpt-5-mini,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
3073,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,pan_african_2025_6,pan,proofs,OPC R1 8B,0.0
3074,GPT-5 (high),openai/gpt-5,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
3075,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3076,o4-mini (high),openai/o4-mini--high,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3077,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
3078,GPT OSS 120B (high),openai/oss-120b,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
3079,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_1,philippines,proofs,OPC R1 8B,0.0
3080,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3081,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3082,GPT-5 (high),openai/gpt-5,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3083,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3084,Grok 4,xai/grok-4,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3085,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
3086,GPT-5 (high),openai/gpt-5,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3087,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3088,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3089,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3090,o4-mini (high),openai/o4-mini--high,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3091,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3092,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3093,GPT OSS 120B (high),openai/oss-120b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3094,Grok 4,xai/grok-4,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3095,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3096,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
3097,GPT OSS 120B (high),openai/oss-120b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3098,Grok 4,xai/grok-4,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3099,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3100,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
3101,o4-mini (high),openai/o4-mini--high,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
3102,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
3103,GPT-5 (high),openai/gpt-5,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
3104,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3105,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3106,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
3107,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_3,philippines,proofs,OPC R1 8B,0.0
3108,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3109,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3110,Grok 4,xai/grok-4,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3111,GPT OSS 120B (high),openai/oss-120b,philippines_2025_4,philippines,proofs,OPC R1 8B,1.0
3112,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3113,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3114,o4-mini (high),openai/o4-mini--high,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3115,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3116,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3117,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3118,GPT-5 (high),openai/gpt-5,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
3119,GPT-5 (high),openai/gpt-5,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3120,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3121,Grok 4,xai/grok-4,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3122,o4-mini (high),openai/o4-mini--high,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
3123,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3124,GPT OSS 120B (high),openai/oss-120b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
3125,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3126,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
3127,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
3128,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
3129,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_5,philippines,proofs,OPC R1 8B,0.0
3130,GPT-5 (high),openai/gpt-5,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3131,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3132,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3133,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3134,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
3135,Grok 4,xai/grok-4,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3136,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3137,o4-mini (high),openai/o4-mini--high,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
3138,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
3139,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
3140,GPT OSS 120B (high),openai/oss-120b,philippines_2025_6,philippines,proofs,OPC R1 8B,0.0
3141,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3142,GPT OSS 120B (high),openai/oss-120b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3143,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3144,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3145,o4-mini (high),openai/o4-mini--high,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3146,Grok 4,xai/grok-4,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3147,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3148,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3149,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3150,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_7,philippines,proofs,OPC R1 8B,0.0
3151,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3152,GPT OSS 120B (high),openai/oss-120b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3153,o4-mini (high),openai/o4-mini--high,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3154,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3155,Qwen3-4B (25/07),qwen/qwen3_4b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3156,gemini-2.5-pro,gemini/gemini-pro-2.5,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3157,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,philippines_2025_8,philippines,proofs,OPC R1 8B,1.0
3158,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3159,Grok 4,xai/grok-4,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
3160,GPT-5-mini (high),openai/gpt-5-mini,philippines_2025_8,philippines,proofs,OPC R1 8B,1.0
3161,Grok 4,xai/grok-4,polish_2025_1,polish,proofs,OPC R1 8B,0.0
3162,GPT-5 (high),openai/gpt-5,polish_2025_1,polish,proofs,OPC R1 8B,0.0
3163,GPT OSS 120B (high),openai/oss-120b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3164,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3165,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3166,o4-mini (high),openai/o4-mini--high,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3167,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3168,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3170,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3171,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_1,polish,proofs,OPC R1 8B,1.0
3172,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
3173,GPT OSS 120B (high),openai/oss-120b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
3174,Grok 4,xai/grok-4,polish_2025_2,polish,proofs,OPC R1 8B,0.0
3175,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3176,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3177,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3178,o4-mini (high),openai/o4-mini--high,polish_2025_2,polish,proofs,OPC R1 8B,0.0
3179,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_2,polish,proofs,OPC R1 8B,0.0
3180,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3181,GPT-5 (high),openai/gpt-5,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3182,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_2,polish,proofs,OPC R1 8B,1.0
3183,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3184,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3185,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3186,GPT-5 (high),openai/gpt-5,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3187,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_3,polish,proofs,OPC R1 8B,0.0
3188,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3189,o4-mini (high),openai/o4-mini--high,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3190,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3191,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3192,GPT OSS 120B (high),openai/oss-120b,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3193,Grok 4,xai/grok-4,polish_2025_3,polish,proofs,OPC R1 8B,1.0
3194,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3195,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3196,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3197,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3198,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3199,GPT OSS 120B (high),openai/oss-120b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3200,GPT-5 (high),openai/gpt-5,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3201,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3202,Grok 4,xai/grok-4,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3203,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3204,o4-mini (high),openai/o4-mini--high,polish_2025_4,polish,proofs,OPC R1 8B,0.0
3205,Grok 4,xai/grok-4,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3206,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3207,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3208,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3209,GPT-5 (high),openai/gpt-5,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3210,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3211,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3212,o4-mini (high),openai/o4-mini--high,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3213,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3214,GPT OSS 120B (high),openai/oss-120b,polish_2025_5,polish,proofs,OPC R1 8B,1.0
3215,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_5,polish,proofs,OPC R1 8B,0.0
3216,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3217,GPT-5 (high),openai/gpt-5,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3218,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3219,gemini-2.5-pro,gemini/gemini-pro-2.5,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3220,o4-mini (high),openai/o4-mini--high,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3221,GPT-5-mini (high),openai/gpt-5-mini,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3222,GPT OSS 120B (high),openai/oss-120b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3223,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3224,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3225,Qwen3-4B (25/07),qwen/qwen3_4b,polish_2025_6,polish,proofs,OPC R1 8B,1.0
3226,Grok 4,xai/grok-4,polish_2025_6,polish,proofs,OPC R1 8B,0.0
3227,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3228,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3229,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3230,GPT-5 (high),openai/gpt-5,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3231,o4-mini (high),openai/o4-mini--high,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3232,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3233,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3234,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3235,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_1,rmm,proofs,OPC R1 8B,1.0
3236,GPT OSS 120B (high),openai/oss-120b,rmm_2025_1,rmm,proofs,OPC R1 8B,0.0
3237,Grok 4,xai/grok-4,rmm_2025_1,rmm,proofs,OPC R1 8B,1.0
3238,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3239,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3240,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
3241,GPT OSS 120B (high),openai/oss-120b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3242,GPT-5 (high),openai/gpt-5,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3243,o4-mini (high),openai/o4-mini--high,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
3244,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
3245,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3246,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
3247,Grok 4,xai/grok-4,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
3248,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_2,rmm,proofs,OPC R1 8B,1.0
3249,o4-mini (high),openai/o4-mini--high,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3250,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3251,GPT-5 (high),openai/gpt-5,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
3252,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3253,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3254,GPT OSS 120B (high),openai/oss-120b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3255,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
3256,Grok 4,xai/grok-4,rmm_2025_3,rmm,proofs,OPC R1 8B,1.0
3257,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3258,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3259,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
3260,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3261,Grok 4,xai/grok-4,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3262,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3263,GPT-5 (high),openai/gpt-5,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3264,o4-mini (high),openai/o4-mini--high,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3265,GPT OSS 120B (high),openai/oss-120b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3266,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3267,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3268,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3269,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
3270,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_4,rmm,proofs,OPC R1 8B,1.0
3271,Grok 4,xai/grok-4,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3272,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3273,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3274,GPT OSS 120B (high),openai/oss-120b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3275,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3276,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3277,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3278,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3279,o4-mini (high),openai/o4-mini--high,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3280,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_5,rmm,proofs,OPC R1 8B,0.0
3281,gemini-2.5-pro,gemini/gemini-pro-2.5,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3282,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
3283,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
3284,GPT-5 (high),openai/gpt-5,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
3285,GPT-5-mini (high),openai/gpt-5-mini,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3286,Qwen3-4B (25/07),qwen/qwen3_4b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3287,Grok 4,xai/grok-4,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
3288,GPT OSS 120B (high),openai/oss-120b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3289,o4-mini (high),openai/o4-mini--high,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3290,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3291,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,rmm_2025_6,rmm,proofs,OPC R1 8B,0.0
3292,o4-mini (high),openai/o4-mini--high,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3293,GPT-5 (high),openai/gpt-5,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3294,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3295,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3296,Grok 4,xai/grok-4,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3297,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_1,romania,proofs,OPC R1 8B,1.0
3298,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3299,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3300,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3301,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3302,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_1,romania,proofs,OPC R1 8B,0.0
3303,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3304,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
3305,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3306,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3307,o4-mini (high),openai/o4-mini--high,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3308,Grok 4,xai/grok-4,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3309,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
3310,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
3311,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3312,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_2,romania,proofs,OPC R1 8B,0.0
3313,GPT-5 (high),openai/gpt-5,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
3314,GPT OSS 120B (high),openai/oss-120b,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3315,GPT-5 (high),openai/gpt-5,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3316,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
3317,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
3318,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3319,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3320,GPT-5-mini (high),openai/gpt-5-mini,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3321,o4-mini (high),openai/o4-mini--high,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3322,Qwen3-4B (25/07),qwen/qwen3_4b,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
3323,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
3324,Grok 4,xai/grok-4,romania_10_2025_3,romania,proofs,OPC R1 8B,0.0
3325,GPT-5-mini (high),openai/gpt-5-mini,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3326,Grok 4,xai/grok-4,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
3327,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3328,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3329,o4-mini (high),openai/o4-mini--high,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3330,GPT-5 (high),openai/gpt-5,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3331,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
3332,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3333,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
3334,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
3335,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_1,romania,proofs,OPC R1 8B,0.0
3336,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3337,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3338,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
3339,GPT-5-mini (high),openai/gpt-5-mini,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
3340,Grok 4,xai/grok-4,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
3341,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
3342,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3343,o4-mini (high),openai/o4-mini--high,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3344,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3345,GPT-5 (high),openai/gpt-5,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
3346,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_2,romania,proofs,OPC R1 8B,0.0
3347,GPT OSS 120B (high),openai/oss-120b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3348,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3349,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3350,o4-mini (high),openai/o4-mini--high,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3351,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3352,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3353,Qwen3-4B (25/07),qwen/qwen3_4b,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3354,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3355,Grok 4,xai/grok-4,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3356,GPT-5 (high),openai/gpt-5,romania_11_2025_3,romania,proofs,OPC R1 8B,0.0
3357,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3358,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_1,romania,proofs,OPC R1 8B,1.0
3359,o4-mini (high),openai/o4-mini--high,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3360,Grok 4,xai/grok-4,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3361,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3362,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3363,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3364,GPT-5 (high),openai/gpt-5,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3365,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_1,romania,proofs,OPC R1 8B,1.0
3366,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_1,romania,proofs,OPC R1 8B,0.0
3367,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3368,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3369,GPT-5-mini (high),openai/gpt-5-mini,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3370,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3371,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3372,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
3373,Grok 4,xai/grok-4,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3374,o4-mini (high),openai/o4-mini--high,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
3375,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_2,romania,proofs,OPC R1 8B,0.0
3376,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3377,GPT-5 (high),openai/gpt-5,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
3378,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3379,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_12_2025_3,romania,proofs,OPC R1 8B,1.0
3380,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3381,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3382,GPT OSS 120B (high),openai/oss-120b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3383,Grok 4,xai/grok-4,romania_12_2025_3,romania,proofs,OPC R1 8B,1.0
3384,o4-mini (high),openai/o4-mini--high,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3385,Qwen3-4B (25/07),qwen/qwen3_4b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3386,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3387,GPT-5 (high),openai/gpt-5,romania_12_2025_3,romania,proofs,OPC R1 8B,0.0
3388,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3389,Grok 4,xai/grok-4,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3390,Qwen3-4B (25/07),qwen/qwen3_4b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3391,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3392,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3393,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3394,o4-mini (high),openai/o4-mini--high,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3395,GPT OSS 120B (high),openai/oss-120b,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3396,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_9_2025_1,romania,proofs,OPC R1 8B,0.0
3397,GPT-5 (high),openai/gpt-5,romania_9_2025_1,romania,proofs,OPC R1 8B,1.0
3398,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3399,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3400,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3401,o4-mini (high),openai/o4-mini--high,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3402,GPT-5 (high),openai/gpt-5,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3403,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3404,Qwen3-4B (25/07),qwen/qwen3_4b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3405,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3406,Grok 4,xai/grok-4,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3407,GPT OSS 120B (high),openai/oss-120b,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
3408,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3409,GPT-5 (high),openai/gpt-5,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3410,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3411,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3412,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_1,romania,proofs,OPC R1 8B,1.0
3413,Grok 4,xai/grok-4,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3414,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3415,o4-mini (high),openai/o4-mini--high,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3416,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3417,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3418,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
3419,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3420,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
3421,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3422,Grok 4,xai/grok-4,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3423,GPT-5 (high),openai/gpt-5,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
3424,o4-mini (high),openai/o4-mini--high,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3425,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
3426,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3427,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
3428,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3429,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_2,romania,proofs,OPC R1 8B,0.0
3430,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3431,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3432,GPT OSS 120B (high),openai/oss-120b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3433,GPT-5-mini (high),openai/gpt-5-mini,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3434,GPT-5 (high),openai/gpt-5,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3435,Grok 4,xai/grok-4,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3436,Qwen3-4B (25/07),qwen/qwen3_4b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3437,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3438,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3439,gemini-2.5-pro,gemini/gemini-pro-2.5,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3440,o4-mini (high),openai/o4-mini--high,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
3441,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3442,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,1.0
3443,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3444,Grok 4,xai/grok-4,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3445,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3446,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3447,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3448,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,0.0
3449,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,1.0
3450,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3451,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3452,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3453,Grok 4,xai/grok-4,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3454,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3455,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,1.0
3456,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3457,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3458,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
3459,Grok 4,xai/grok-4,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
3460,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
3461,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
3462,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
3463,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
3464,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
3465,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
3466,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
3467,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,0.0
3468,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3469,gemini-2.5-pro,gemini/gemini-pro-2.5,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3470,Grok 4,xai/grok-4,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3471,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3472,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3473,o4-mini (high),openai/o4-mini--high,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3474,Qwen3-4B (25/07),qwen/qwen3_4b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3475,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3476,GPT OSS 120B (high),openai/oss-120b,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
3477,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_1,spain,proofs,OPC R1 8B,0.0
3478,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3479,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3480,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3481,GPT-5 (high),openai/gpt-5,spain_2025_1,spain,proofs,OPC R1 8B,0.0
3482,GPT OSS 120B (high),openai/oss-120b,spain_2025_1,spain,proofs,OPC R1 8B,0.0
3483,o4-mini (high),openai/o4-mini--high,spain_2025_1,spain,proofs,OPC R1 8B,0.0
3484,Grok 4,xai/grok-4,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3485,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3486,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_1,spain,proofs,OPC R1 8B,0.0
3487,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_1,spain,proofs,OPC R1 8B,1.0
3488,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3489,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3490,GPT OSS 120B (high),openai/oss-120b,spain_2025_2,spain,proofs,OPC R1 8B,0.0
3491,o4-mini (high),openai/o4-mini--high,spain_2025_2,spain,proofs,OPC R1 8B,0.0
3492,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_2,spain,proofs,OPC R1 8B,0.0
3493,GPT-5 (high),openai/gpt-5,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3494,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3495,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3496,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3497,Grok 4,xai/grok-4,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3498,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_2,spain,proofs,OPC R1 8B,1.0
3499,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_3,spain,proofs,OPC R1 8B,1.0
3500,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3501,o4-mini (high),openai/o4-mini--high,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3502,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3503,GPT OSS 120B (high),openai/oss-120b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3504,GPT-5 (high),openai/gpt-5,spain_2025_3,spain,proofs,OPC R1 8B,1.0
3505,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3506,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3507,Grok 4,xai/grok-4,spain_2025_3,spain,proofs,OPC R1 8B,0.0
3508,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_3,spain,proofs,OPC R1 8B,1.0
3509,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_4,spain,proofs,OPC R1 8B,1.0
3510,Grok 4,xai/grok-4,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3511,GPT-5 (high),openai/gpt-5,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3512,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3513,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3514,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3515,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3516,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3517,GPT OSS 120B (high),openai/oss-120b,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3518,o4-mini (high),openai/o4-mini--high,spain_2025_4,spain,proofs,OPC R1 8B,0.0
3519,GPT-5 (high),openai/gpt-5,spain_2025_5,spain,proofs,OPC R1 8B,1.0
3520,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3521,GPT-5-mini (high),openai/gpt-5-mini,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3522,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3523,Grok 4,xai/grok-4,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3524,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3525,gemini-2.5-pro,gemini/gemini-pro-2.5,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3526,o4-mini (high),openai/o4-mini--high,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3527,GPT OSS 120B (high),openai/oss-120b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3528,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3529,Qwen3-4B (25/07),qwen/qwen3_4b,spain_2025_5,spain,proofs,OPC R1 8B,0.0
3530,Grok 4,xai/grok-4,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3531,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3532,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3533,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3534,GPT OSS 120B (high),openai/oss-120b,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3535,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_1,thai,proofs,OPC R1 8B,0.0
3536,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3537,o4-mini (high),openai/o4-mini--high,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3538,GPT-5 (high),openai/gpt-5,thai_2025_1,thai,proofs,OPC R1 8B,1.0
3539,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_1,thai,proofs,OPC R1 8B,0.0
3540,Grok 4,xai/grok-4,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3541,o4-mini (high),openai/o4-mini--high,thai_2025_10,thai,proofs,OPC R1 8B,1.0
3542,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3543,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3544,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3545,GPT OSS 120B (high),openai/oss-120b,thai_2025_10,thai,proofs,OPC R1 8B,1.0
3546,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3547,GPT-5 (high),openai/gpt-5,thai_2025_10,thai,proofs,OPC R1 8B,1.0
3548,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_10,thai,proofs,OPC R1 8B,1.0
3549,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_10,thai,proofs,OPC R1 8B,1.0
3550,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_10,thai,proofs,OPC R1 8B,0.0
3551,GPT OSS 120B (high),openai/oss-120b,thai_2025_2,thai,proofs,OPC R1 8B,0.0
3552,o4-mini (high),openai/o4-mini--high,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3553,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3554,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3555,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3556,GPT-5 (high),openai/gpt-5,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3557,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3558,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3559,Grok 4,xai/grok-4,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3560,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3561,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_2,thai,proofs,OPC R1 8B,1.0
3562,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
3563,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
3564,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_3,thai,proofs,OPC R1 8B,1.0
3565,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_3,thai,proofs,OPC R1 8B,0.0
3566,Grok 4,xai/grok-4,thai_2025_3,thai,proofs,OPC R1 8B,0.0
3567,GPT-5 (high),openai/gpt-5,thai_2025_3,thai,proofs,OPC R1 8B,1.0
3568,GPT OSS 120B (high),openai/oss-120b,thai_2025_3,thai,proofs,OPC R1 8B,1.0
3569,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_3,thai,proofs,OPC R1 8B,1.0
3570,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_3,thai,proofs,OPC R1 8B,0.0
3571,o4-mini (high),openai/o4-mini--high,thai_2025_3,thai,proofs,OPC R1 8B,1.0
3572,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_4,thai,proofs,OPC R1 8B,1.0
3573,GPT-5 (high),openai/gpt-5,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3574,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3575,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3576,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3577,GPT OSS 120B (high),openai/oss-120b,thai_2025_4,thai,proofs,OPC R1 8B,1.0
3578,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3579,o4-mini (high),openai/o4-mini--high,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3580,Grok 4,xai/grok-4,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3581,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_4,thai,proofs,OPC R1 8B,0.0
3582,GPT-5 (high),openai/gpt-5,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3583,GPT OSS 120B (high),openai/oss-120b,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3584,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3585,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3586,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_5,thai,proofs,OPC R1 8B,0.0
3587,Grok 4,xai/grok-4,thai_2025_5,thai,proofs,OPC R1 8B,0.0
3588,o4-mini (high),openai/o4-mini--high,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3589,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
3590,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_5,thai,proofs,OPC R1 8B,1.0
3591,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
3592,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_5,thai,proofs,OPC R1 8B,0.0
3593,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
3594,Grok 4,xai/grok-4,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3595,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3596,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
3597,o4-mini (high),openai/o4-mini--high,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3598,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3599,GPT OSS 120B (high),openai/oss-120b,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3600,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3601,GPT-5 (high),openai/gpt-5,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3602,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_6,thai,proofs,OPC R1 8B,0.0
3603,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_6,thai,proofs,OPC R1 8B,1.0
3604,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3605,GPT-5 (high),openai/gpt-5,thai_2025_7,thai,proofs,OPC R1 8B,1.0
3606,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3607,o4-mini (high),openai/o4-mini--high,thai_2025_7,thai,proofs,OPC R1 8B,1.0
3608,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_7,thai,proofs,OPC R1 8B,1.0
3609,GPT OSS 120B (high),openai/oss-120b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3610,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3611,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_7,thai,proofs,OPC R1 8B,1.0
3612,Grok 4,xai/grok-4,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3613,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_7,thai,proofs,OPC R1 8B,0.0
3614,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3615,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_8,thai,proofs,OPC R1 8B,1.0
3616,GPT OSS 120B (high),openai/oss-120b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3617,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_8,thai,proofs,OPC R1 8B,1.0
3618,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_8,thai,proofs,OPC R1 8B,1.0
3619,GPT-5 (high),openai/gpt-5,thai_2025_8,thai,proofs,OPC R1 8B,1.0
3620,o4-mini (high),openai/o4-mini--high,thai_2025_8,thai,proofs,OPC R1 8B,1.0
3621,Grok 4,xai/grok-4,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3622,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3623,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3624,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_8,thai,proofs,OPC R1 8B,0.0
3625,o4-mini (high),openai/o4-mini--high,thai_2025_9,thai,proofs,OPC R1 8B,1.0
3626,GPT OSS 120B (high),openai/oss-120b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3627,Qwen3-4B (25/07),qwen/qwen3_4b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3628,GPT-5 (high),openai/gpt-5,thai_2025_9,thai,proofs,OPC R1 8B,1.0
3629,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,thai_2025_9,thai,proofs,OPC R1 8B,1.0
3630,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3631,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3632,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3633,gemini-2.5-pro,gemini/gemini-pro-2.5,thai_2025_9,thai,proofs,OPC R1 8B,0.0
3634,Grok 4,xai/grok-4,thai_2025_9,thai,proofs,OPC R1 8B,1.0
3635,GPT-5-mini (high),openai/gpt-5-mini,thai_2025_9,thai,proofs,OPC R1 8B,1.0
3636,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3637,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3638,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
3639,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3640,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3641,GPT-5 (high),openai/gpt-5,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3642,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
3643,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,0.0
3644,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3645,Grok 4,xai/grok-4,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3646,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
3647,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3648,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3649,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3650,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3651,Grok 4,xai/grok-4,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3652,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,1.0
3653,GPT-5 (high),openai/gpt-5,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,1.0
3654,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3655,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3656,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3657,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,0.0
3658,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,1.0
3659,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3660,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3661,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3662,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,1.0
3663,Grok 4,xai/grok-4,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3664,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3665,GPT-5 (high),openai/gpt-5,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3666,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3667,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3668,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
3669,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3670,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3671,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3672,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3673,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3674,Grok 4,xai/grok-4,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3675,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3676,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3677,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3678,GPT-5 (high),openai/gpt-5,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3679,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
3680,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3681,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3682,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3683,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3684,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3685,GPT-5 (high),openai/gpt-5,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3686,Grok 4,xai/grok-4,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3687,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3688,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3689,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
3690,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3691,GPT-5 (high),openai/gpt-5,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3692,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3693,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3694,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3695,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3696,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3697,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3698,Grok 4,xai/grok-4,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3699,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,1.0
3700,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
3701,Grok 4,xai/grok-4,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3702,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3703,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3704,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3705,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3706,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3707,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3708,GPT-5 (high),openai/gpt-5,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3709,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3710,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3711,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
3712,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3713,Grok 4,xai/grok-4,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3714,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3715,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,1.0
3716,GPT-5 (high),openai/gpt-5,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3717,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3718,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3719,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3720,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3721,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3722,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
3723,Qwen3-4B (25/07),qwen/qwen3_4b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3724,Grok 4,xai/grok-4,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3725,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3726,gemini-2.5-pro,gemini/gemini-pro-2.5,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3727,GPT-5 (high),openai/gpt-5,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3728,o4-mini (high),openai/o4-mini--high,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3729,GPT OSS 120B (high),openai/oss-120b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3730,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,1.0
3731,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3732,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,1.0
3733,GPT-5-mini (high),openai/gpt-5-mini,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
3734,GPT OSS 120B (high),openai/oss-120b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3735,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
3736,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3737,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
3738,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3739,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3740,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3741,Grok 4,xai/grok-4,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3742,o4-mini (high),openai/o4-mini--high,usamo_2025_1,usamo,proofs,OPC R1 8B,0.0
3743,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
3744,GPT-5 (high),openai/gpt-5,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
3745,GPT OSS 120B (high),openai/oss-120b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3746,o4-mini (high),openai/o4-mini--high,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3747,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3748,Grok 4,xai/grok-4,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3749,GPT-5 (high),openai/gpt-5,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3750,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3751,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3752,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3753,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3754,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3755,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
3756,o4-mini (high),openai/o4-mini--high,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3757,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3758,GPT-5 (high),openai/gpt-5,usamo_2025_3,usamo,proofs,OPC R1 8B,1.0
3759,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3760,GPT OSS 120B (high),openai/oss-120b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3761,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3762,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3763,Grok 4,xai/grok-4,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3764,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3765,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3766,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_3,usamo,proofs,OPC R1 8B,0.0
3767,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3768,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3769,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3770,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
3771,Grok 4,xai/grok-4,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3772,GPT-5 (high),openai/gpt-5,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3773,GPT OSS 120B (high),openai/oss-120b,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3774,o4-mini (high),openai/o4-mini--high,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
3775,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
3776,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
3777,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_4,usamo,proofs,OPC R1 8B,0.0
3778,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3779,o4-mini (high),openai/o4-mini--high,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3780,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3781,GPT-5 (high),openai/gpt-5,usamo_2025_5,usamo,proofs,OPC R1 8B,1.0
3782,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3783,Grok 4,xai/grok-4,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3784,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3785,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3786,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3787,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3788,GPT OSS 120B (high),openai/oss-120b,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
3789,GPT OSS 120B (high),openai/oss-120b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3790,GPT-5 (high),openai/gpt-5,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3791,Qwen3-4B (25/07),qwen/qwen3_4b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3792,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3793,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3794,GPT-5-mini (high),openai/gpt-5-mini,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3795,o4-mini (high),openai/o4-mini--high,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3796,Grok 4,xai/grok-4,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3797,gemini-2.5-pro,gemini/gemini-pro-2.5,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3798,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3799,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
3800,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
3801,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3802,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
3803,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3804,o4-mini (high),openai/o4-mini--high,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
3805,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3806,Grok 4,xai/grok-4,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3807,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3808,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_1,usatst,proofs,OPC R1 8B,0.0
3809,GPT OSS 120B (high),openai/oss-120b,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
3810,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3811,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3812,Grok 4,xai/grok-4,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3813,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3814,GPT-5 (high),openai/gpt-5,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3815,GPT OSS 120B (high),openai/oss-120b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3816,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3817,o4-mini (high),openai/o4-mini--high,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3818,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_2,usatst,proofs,OPC R1 8B,1.0
3819,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3820,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
3821,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3822,Grok 4,xai/grok-4,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3823,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3824,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_3,usatst,proofs,OPC R1 8B,1.0
3825,o4-mini (high),openai/o4-mini--high,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3826,GPT OSS 120B (high),openai/oss-120b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3827,GPT-5 (high),openai/gpt-5,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3828,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3829,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3830,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
3831,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3832,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3833,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3834,o4-mini (high),openai/o4-mini--high,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3835,GPT-5 (high),openai/gpt-5,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3836,Grok 4,xai/grok-4,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3837,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
3838,GPT OSS 120B (high),openai/oss-120b,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3839,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
3840,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_4,usatst,proofs,OPC R1 8B,1.0
3841,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
3842,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3843,GPT-5 (high),openai/gpt-5,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3844,o4-mini (high),openai/o4-mini--high,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3845,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3846,GPT OSS 120B (high),openai/oss-120b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3847,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3848,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3849,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3850,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3851,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3852,Grok 4,xai/grok-4,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
3853,o4-mini (high),openai/o4-mini--high,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3854,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3855,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3856,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3857,Grok 4,xai/grok-4,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3858,GPT-5 (high),openai/gpt-5,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3859,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3860,GPT OSS 120B (high),openai/oss-120b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3861,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3862,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3863,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_6,usatst,proofs,OPC R1 8B,0.0
3864,o4-mini (high),openai/o4-mini--high,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3865,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3866,GPT-5 (high),openai/gpt-5,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3867,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3868,GPT OSS 120B (high),openai/oss-120b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3869,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_7,usatst,proofs,OPC R1 8B,1.0
3870,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3871,Grok 4,xai/grok-4,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3872,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3873,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3874,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_7,usatst,proofs,OPC R1 8B,0.0
3875,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3876,o4-mini (high),openai/o4-mini--high,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3877,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3878,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3879,GPT OSS 120B (high),openai/oss-120b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3880,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3881,GPT-5 (high),openai/gpt-5,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3882,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3883,Grok 4,xai/grok-4,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3884,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3885,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
3886,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3887,Qwen3-4B (25/07),qwen/qwen3_4b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3888,GPT-5 (high),openai/gpt-5,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3889,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3890,o4-mini (high),openai/o4-mini--high,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3891,Grok 4,xai/grok-4,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3892,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3893,gemini-2.5-pro,gemini/gemini-pro-2.5,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3894,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3895,GPT OSS 120B (high),openai/oss-120b,usatst_2025_9,usatst,proofs,OPC R1 8B,1.0
3896,GPT-5-mini (high),openai/gpt-5-mini,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
3897,Grok 4,xai/grok-4,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3898,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3899,GPT-5 (high),openai/gpt-5,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3900,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3901,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3902,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3903,o4-mini (high),openai/o4-mini--high,vietnam_2025_1,vietnam,proofs,OPC R1 8B,0.0
3904,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,0.0
3905,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3906,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3907,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
3908,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3909,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3910,Grok 4,xai/grok-4,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3911,o4-mini (high),openai/o4-mini--high,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3912,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
3913,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
3914,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
3915,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3916,GPT-5 (high),openai/gpt-5,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
3917,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
3918,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_2,vietnam,proofs,OPC R1 8B,0.0
3919,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,1.0
3920,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3921,Grok 4,xai/grok-4,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3922,GPT-5 (high),openai/gpt-5,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3923,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3924,o4-mini (high),openai/o4-mini--high,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3925,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3926,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3927,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3928,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3929,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
3930,Grok 4,xai/grok-4,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3931,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3932,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,1.0
3933,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3934,GPT-5 (high),openai/gpt-5,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3935,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3936,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3937,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3938,o4-mini (high),openai/o4-mini--high,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3939,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
3940,Grok 4,xai/grok-4,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3941,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3942,o4-mini (high),openai/o4-mini--high,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3943,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3944,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3945,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3946,GPT-5 (high),openai/gpt-5,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3947,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3948,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3949,GPT-5-mini (high),openai/gpt-5-mini,vietnam_2025_5,vietnam,proofs,OPC R1 8B,1.0
3950,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
3951,GPT OSS 120B (high),openai/oss-120b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,1.0
3952,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3953,GPT-5 (high),openai/gpt-5,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3954,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3955,o4-mini (high),openai/o4-mini--high,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3956,Grok 4 Fast (Reasoning),xai/grok-4-fast-reasoning,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3957,DeepSeek-R1-Qwen3-8B,deepseek/deepseek_distill_8b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3958,gemini-2.5-pro,gemini/gemini-pro-2.5,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3959,Qwen3-4B (25/07),qwen/qwen3_4b,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
3960,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
3961,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,0.75
3962,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
3963,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
3964,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
3965,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
3966,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
3967,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
3968,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
3969,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
3970,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
3971,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
3972,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
3973,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
3974,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
3975,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
3976,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
3977,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
3978,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
3979,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
3980,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
3981,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.75
3982,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
3983,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
3984,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
3985,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
3986,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
3987,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
3988,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
3989,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
3990,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
3991,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
3992,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
3993,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
3994,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
3995,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
3996,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
3997,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
3998,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
3999,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4000,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4001,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,0.75
4002,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.5
4003,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4004,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4005,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,0.75
4006,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4007,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,0.75
4008,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4009,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4010,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
4011,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.75
4012,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4013,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
4014,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4015,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4016,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4017,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
4018,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4019,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4020,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4021,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
4022,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4023,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4024,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
4025,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
4026,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
4027,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4028,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4029,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4030,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4031,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4032,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
4033,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4034,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4035,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4036,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4037,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
4038,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4039,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4040,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,1.0
4041,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
4042,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4043,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
4044,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4045,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4046,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4047,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,0.75
4048,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,0.75
4049,o4-mini (high),openai/o4-mini--high,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4050,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4051,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
4052,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4053,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4054,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.25
4055,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
4056,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
4057,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4058,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4059,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,0.75
4060,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4061,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4062,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.75
4063,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4064,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4065,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4066,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4067,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
4068,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4069,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4070,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
4071,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
4072,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4073,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.75
4074,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4075,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4076,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4077,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
4078,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4079,GPT-5-mini (high),openai/gpt-5-mini,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4080,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4081,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
4082,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4083,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4084,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
4085,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
4086,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.5
4087,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4088,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4089,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4090,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4091,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4092,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
4093,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4094,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4095,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4096,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4097,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
4098,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4099,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4100,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
4101,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
4102,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4103,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,1.0
4104,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4105,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4106,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4107,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
4108,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4109,GPT-5 (high),openai/gpt-5,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4110,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4111,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
4112,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4113,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4114,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.75
4115,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.25
4116,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
4117,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4118,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4119,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4120,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4121,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4122,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
4123,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4124,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4125,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4126,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4127,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,0.75
4128,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4129,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4130,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.75
4131,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
4132,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4133,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
4134,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4135,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4136,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4137,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,0.75
4138,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4139,GPT OSS 120B (high),openai/oss-20b,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4140,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4141,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,0.75
4142,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4143,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4144,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,0.25
4145,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.0
4146,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
4147,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4148,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4149,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4150,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4151,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4152,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,0.75
4153,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4154,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4155,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4156,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4157,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
4158,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4159,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4160,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.25
4161,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,0.25
4162,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4163,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.0
4164,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4165,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4166,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4167,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
4168,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4169,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4170,Grok 4,xai/grok-4,matharena_aime/aime_2025_1,matharena,matharena,Final Answer Parser,1.0
4171,Grok 4,xai/grok-4,matharena_aime/aime_2025_10,matharena,matharena,Final Answer Parser,1.0
4172,Grok 4,xai/grok-4,matharena_aime/aime_2025_11,matharena,matharena,Final Answer Parser,1.0
4173,Grok 4,xai/grok-4,matharena_aime/aime_2025_12,matharena,matharena,Final Answer Parser,1.0
4174,Grok 4,xai/grok-4,matharena_aime/aime_2025_13,matharena,matharena,Final Answer Parser,1.0
4175,Grok 4,xai/grok-4,matharena_aime/aime_2025_14,matharena,matharena,Final Answer Parser,0.5
4176,Grok 4,xai/grok-4,matharena_aime/aime_2025_15,matharena,matharena,Final Answer Parser,0.0
4177,Grok 4,xai/grok-4,matharena_aime/aime_2025_16,matharena,matharena,Final Answer Parser,1.0
4178,Grok 4,xai/grok-4,matharena_aime/aime_2025_17,matharena,matharena,Final Answer Parser,1.0
4179,Grok 4,xai/grok-4,matharena_aime/aime_2025_18,matharena,matharena,Final Answer Parser,1.0
4180,Grok 4,xai/grok-4,matharena_aime/aime_2025_19,matharena,matharena,Final Answer Parser,1.0
4181,Grok 4,xai/grok-4,matharena_aime/aime_2025_2,matharena,matharena,Final Answer Parser,1.0
4182,Grok 4,xai/grok-4,matharena_aime/aime_2025_20,matharena,matharena,Final Answer Parser,1.0
4183,Grok 4,xai/grok-4,matharena_aime/aime_2025_21,matharena,matharena,Final Answer Parser,1.0
4184,Grok 4,xai/grok-4,matharena_aime/aime_2025_22,matharena,matharena,Final Answer Parser,1.0
4185,Grok 4,xai/grok-4,matharena_aime/aime_2025_23,matharena,matharena,Final Answer Parser,1.0
4186,Grok 4,xai/grok-4,matharena_aime/aime_2025_24,matharena,matharena,Final Answer Parser,1.0
4187,Grok 4,xai/grok-4,matharena_aime/aime_2025_25,matharena,matharena,Final Answer Parser,1.0
4188,Grok 4,xai/grok-4,matharena_aime/aime_2025_26,matharena,matharena,Final Answer Parser,1.0
4189,Grok 4,xai/grok-4,matharena_aime/aime_2025_27,matharena,matharena,Final Answer Parser,1.0
4190,Grok 4,xai/grok-4,matharena_aime/aime_2025_28,matharena,matharena,Final Answer Parser,0.25
4191,Grok 4,xai/grok-4,matharena_aime/aime_2025_29,matharena,matharena,Final Answer Parser,1.0
4192,Grok 4,xai/grok-4,matharena_aime/aime_2025_3,matharena,matharena,Final Answer Parser,1.0
4193,Grok 4,xai/grok-4,matharena_aime/aime_2025_30,matharena,matharena,Final Answer Parser,0.5
4194,Grok 4,xai/grok-4,matharena_aime/aime_2025_4,matharena,matharena,Final Answer Parser,1.0
4195,Grok 4,xai/grok-4,matharena_aime/aime_2025_5,matharena,matharena,Final Answer Parser,1.0
4196,Grok 4,xai/grok-4,matharena_aime/aime_2025_6,matharena,matharena,Final Answer Parser,1.0
4197,Grok 4,xai/grok-4,matharena_aime/aime_2025_7,matharena,matharena,Final Answer Parser,1.0
4198,Grok 4,xai/grok-4,matharena_aime/aime_2025_8,matharena,matharena,Final Answer Parser,1.0
4199,Grok 4,xai/grok-4,matharena_aime/aime_2025_9,matharena,matharena,Final Answer Parser,1.0
4200,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4201,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4202,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4203,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4204,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
4205,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
4206,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
4207,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
4208,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4209,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
4210,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4211,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4212,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.25
4213,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.25
4214,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4215,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
4216,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4217,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,0.75
4218,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4219,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4220,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
4221,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
4222,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4223,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,1.0
4224,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4225,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
4226,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4227,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.25
4228,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.5
4229,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
4230,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4231,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.75
4232,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
4233,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4234,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.5
4235,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
4236,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4237,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
4238,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4239,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
4240,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4241,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4242,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4243,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4244,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,0.5
4245,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,0.75
4246,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.0
4247,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.0
4248,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4249,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,1.0
4250,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,0.5
4251,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4252,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.0
4253,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.5
4254,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4255,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,1.0
4256,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4257,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,0.5
4258,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4259,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4260,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.0
4261,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
4262,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,0.5
4263,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.0
4264,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4265,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.0
4266,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4267,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.0
4268,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.75
4269,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.5
4270,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,0.0
4271,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.0
4272,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.0
4273,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4274,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.0
4275,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.25
4276,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4277,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
4278,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4279,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.5
4280,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,0.5
4281,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4282,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4283,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4284,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
4285,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
4286,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
4287,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
4288,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4289,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
4290,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4291,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4292,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
4293,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
4294,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4295,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
4296,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4297,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
4298,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4299,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4300,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
4301,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
4302,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4303,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.5
4304,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4305,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
4306,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4307,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
4308,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.5
4309,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.75
4310,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4311,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.25
4312,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
4313,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4314,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.75
4315,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
4316,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,0.75
4317,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.5
4318,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4319,GPT-5-mini (high),openai/gpt-5-mini,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
4320,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4321,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4322,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4323,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4324,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
4325,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
4326,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.75
4327,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
4328,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4329,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.75
4330,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4331,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4332,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.75
4333,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
4334,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4335,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.75
4336,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4337,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
4338,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4339,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4340,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
4341,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,0.75
4342,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4343,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.75
4344,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4345,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
4346,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4347,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
4348,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
4349,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
4350,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4351,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
4352,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.75
4353,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4354,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.75
4355,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
4356,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4357,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.75
4358,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4359,GPT-5 (high),openai/gpt-5,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
4360,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4361,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4362,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4363,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,0.75
4364,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
4365,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
4366,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.5
4367,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,1.0
4368,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4369,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
4370,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4371,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4372,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
4373,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,0.5
4374,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4375,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,1.0
4376,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4377,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
4378,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4379,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4380,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.5
4381,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
4382,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4383,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.25
4384,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4385,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.75
4386,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4387,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
4388,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,0.75
4389,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,0.5
4390,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4391,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
4392,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.5
4393,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4394,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,1.0
4395,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.5
4396,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4397,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.25
4398,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4399,o4-mini (high),openai/o4-mini--high,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,1.0
4400,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4401,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4402,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4403,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4404,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,0.5
4405,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,0.75
4406,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.25
4407,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.75
4408,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4409,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.0
4410,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4411,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4412,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,0.25
4413,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
4414,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,1.0
4415,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.5
4416,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4417,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
4418,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4419,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,0.75
4420,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
4421,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,0.5
4422,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4423,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.0
4424,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4425,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.5
4426,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4427,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.5
4428,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
4429,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
4430,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4431,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,1.0
4432,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,0.25
4433,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4434,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.5
4435,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,0.0
4436,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4437,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.0
4438,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4439,GPT OSS 120B (high),openai/oss-20b,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.75
4440,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_1,matharena,matharena,Final Answer Parser,1.0
4441,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_10,matharena,matharena,Final Answer Parser,1.0
4442,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_11,matharena,matharena,Final Answer Parser,1.0
4443,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_12,matharena,matharena,Final Answer Parser,1.0
4444,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_13,matharena,matharena,Final Answer Parser,1.0
4445,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_14,matharena,matharena,Final Answer Parser,1.0
4446,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_15,matharena,matharena,Final Answer Parser,0.0
4447,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_16,matharena,matharena,Final Answer Parser,0.75
4448,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_17,matharena,matharena,Final Answer Parser,1.0
4449,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_18,matharena,matharena,Final Answer Parser,0.5
4450,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_19,matharena,matharena,Final Answer Parser,1.0
4451,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_2,matharena,matharena,Final Answer Parser,1.0
4452,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_20,matharena,matharena,Final Answer Parser,1.0
4453,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_21,matharena,matharena,Final Answer Parser,1.0
4454,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_22,matharena,matharena,Final Answer Parser,0.75
4455,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_23,matharena,matharena,Final Answer Parser,0.0
4456,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_24,matharena,matharena,Final Answer Parser,1.0
4457,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_25,matharena,matharena,Final Answer Parser,1.0
4458,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_26,matharena,matharena,Final Answer Parser,1.0
4459,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_27,matharena,matharena,Final Answer Parser,1.0
4460,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_28,matharena,matharena,Final Answer Parser,0.25
4461,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_29,matharena,matharena,Final Answer Parser,1.0
4462,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_3,matharena,matharena,Final Answer Parser,1.0
4463,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_30,matharena,matharena,Final Answer Parser,0.75
4464,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_31,matharena,matharena,Final Answer Parser,1.0
4465,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_32,matharena,matharena,Final Answer Parser,0.75
4466,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_33,matharena,matharena,Final Answer Parser,1.0
4467,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_34,matharena,matharena,Final Answer Parser,0.75
4468,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_35,matharena,matharena,Final Answer Parser,1.0
4469,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_36,matharena,matharena,Final Answer Parser,1.0
4470,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_37,matharena,matharena,Final Answer Parser,1.0
4471,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_38,matharena,matharena,Final Answer Parser,0.5
4472,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_39,matharena,matharena,Final Answer Parser,1.0
4473,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_4,matharena,matharena,Final Answer Parser,1.0
4474,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_40,matharena,matharena,Final Answer Parser,0.0
4475,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_5,matharena,matharena,Final Answer Parser,1.0
4476,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_6,matharena,matharena,Final Answer Parser,1.0
4477,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_7,matharena,matharena,Final Answer Parser,0.5
4478,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_8,matharena,matharena,Final Answer Parser,1.0
4479,Grok 4,xai/grok-4,matharena_cmimc/cmimc_2025_9,matharena,matharena,Final Answer Parser,0.75
4480,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4481,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4482,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
4483,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4484,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.5
4485,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.5
4486,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.75
4487,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
4488,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
4489,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
4490,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
4491,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4492,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.25
4493,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4494,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4495,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4496,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.75
4497,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
4498,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4499,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4500,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4501,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
4502,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,0.75
4503,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.75
4504,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4505,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4506,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,0.75
4507,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4508,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4509,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4510,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4511,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4512,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
4513,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4514,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
4515,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.0
4516,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.5
4517,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
4518,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
4519,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.5
4520,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
4521,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4522,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
4523,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4524,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4525,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4526,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
4527,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
4528,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4529,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4530,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4531,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
4532,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4533,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.75
4534,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4535,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4536,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4537,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4538,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4539,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4540,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4541,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4542,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
4543,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4544,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
4545,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
4546,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
4547,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.75
4548,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.25
4549,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.75
4550,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
4551,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4552,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
4553,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4554,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4555,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4556,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
4557,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
4558,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,0.75
4559,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,0.75
4560,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4561,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
4562,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4563,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
4564,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4565,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,0.75
4566,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4567,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4568,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4569,o4-mini (high),openai/o4-mini--high,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,0.75
4570,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4571,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4572,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
4573,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4574,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
4575,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
4576,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
4577,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
4578,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.5
4579,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
4580,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.25
4581,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4582,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
4583,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4584,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4585,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4586,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
4587,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
4588,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4589,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4590,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4591,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
4592,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4593,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.5
4594,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4595,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4596,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4597,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4598,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4599,GPT-5-mini (high),openai/gpt-5-mini,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4600,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4601,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4602,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
4603,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4604,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
4605,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
4606,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
4607,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
4608,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.25
4609,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.5
4610,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.5
4611,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4612,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.75
4613,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4614,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4615,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4616,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
4617,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.75
4618,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4619,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,0.75
4620,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4621,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,1.0
4622,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4623,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
4624,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4625,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4626,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4627,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4628,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4629,GPT-5 (high),openai/gpt-5,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4630,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4631,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,0.25
4632,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
4633,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4634,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,1.0
4635,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.25
4636,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
4637,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.5
4638,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.5
4639,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.25
4640,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
4641,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4642,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
4643,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4644,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4645,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4646,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.75
4647,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
4648,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4649,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4650,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4651,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.0
4652,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4653,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.25
4654,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4655,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4656,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4657,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4658,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4659,GPT OSS 120B (high),openai/oss-20b,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4660,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4661,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,0.75
4662,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,0.75
4663,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,0.25
4664,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.0
4665,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,0.0
4666,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,0.25
4667,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,0.75
4668,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.0
4669,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,0.75
4670,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.0
4671,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4672,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.0
4673,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4674,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4675,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4676,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,0.5
4677,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,0.0
4678,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,0.75
4679,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4680,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4681,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.5
4682,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4683,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.0
4684,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4685,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4686,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4687,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,0.75
4688,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4689,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,0.75
4690,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_1,matharena,matharena,Final Answer Parser,1.0
4691,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_10,matharena,matharena,Final Answer Parser,1.0
4692,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_11,matharena,matharena,Final Answer Parser,1.0
4693,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_12,matharena,matharena,Final Answer Parser,1.0
4694,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_13,matharena,matharena,Final Answer Parser,0.75
4695,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_14,matharena,matharena,Final Answer Parser,1.0
4696,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_15,matharena,matharena,Final Answer Parser,1.0
4697,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_16,matharena,matharena,Final Answer Parser,1.0
4698,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_17,matharena,matharena,Final Answer Parser,0.75
4699,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_18,matharena,matharena,Final Answer Parser,1.0
4700,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_19,matharena,matharena,Final Answer Parser,0.5
4701,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_2,matharena,matharena,Final Answer Parser,1.0
4702,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_20,matharena,matharena,Final Answer Parser,0.5
4703,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_21,matharena,matharena,Final Answer Parser,1.0
4704,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_22,matharena,matharena,Final Answer Parser,1.0
4705,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_23,matharena,matharena,Final Answer Parser,1.0
4706,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_24,matharena,matharena,Final Answer Parser,1.0
4707,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_25,matharena,matharena,Final Answer Parser,1.0
4708,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_26,matharena,matharena,Final Answer Parser,1.0
4709,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_27,matharena,matharena,Final Answer Parser,1.0
4710,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_28,matharena,matharena,Final Answer Parser,1.0
4711,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_29,matharena,matharena,Final Answer Parser,0.75
4712,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_3,matharena,matharena,Final Answer Parser,1.0
4713,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_30,matharena,matharena,Final Answer Parser,0.5
4714,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_4,matharena,matharena,Final Answer Parser,1.0
4715,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_5,matharena,matharena,Final Answer Parser,1.0
4716,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_6,matharena,matharena,Final Answer Parser,1.0
4717,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_7,matharena,matharena,Final Answer Parser,1.0
4718,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_8,matharena,matharena,Final Answer Parser,1.0
4719,Grok 4,xai/grok-4,matharena_hmmt/hmmt_feb_2025_9,matharena,matharena,Final Answer Parser,1.0
4720,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4721,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4722,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4723,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4724,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
4725,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4726,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4727,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4728,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
4729,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
4730,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
4731,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4732,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
4733,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4734,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.5
4735,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
4736,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
4737,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
4738,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
4739,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
4740,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
4741,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
4742,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
4743,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.5
4744,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
4745,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
4746,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
4747,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
4748,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
4749,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
4750,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.5
4751,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.75
4752,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
4753,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
4754,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,0.75
4755,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
4756,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
4757,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
4758,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
4759,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
4760,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
4761,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
4762,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
4763,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
4764,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
4765,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.0
4766,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
4767,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
4768,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
4769,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
4770,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
4771,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
4772,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
4773,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4774,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4775,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4776,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4777,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.75
4778,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4779,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4780,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4781,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,0.5
4782,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,0.75
4783,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
4784,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4785,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
4786,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4787,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.25
4788,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
4789,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
4790,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
4791,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
4792,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,1.0
4793,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
4794,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
4795,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
4796,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.25
4797,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
4798,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
4799,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
4800,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
4801,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
4802,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
4803,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.5
4804,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.75
4805,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
4806,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
4807,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
4808,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
4809,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
4810,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
4811,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
4812,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
4813,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
4814,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
4815,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
4816,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
4817,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
4818,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
4819,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
4820,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
4821,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
4822,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
4823,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
4824,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
4825,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
4826,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4827,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4828,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4829,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4830,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.5
4831,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4832,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4833,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4834,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
4835,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
4836,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
4837,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4838,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
4839,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4840,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
4841,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
4842,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,0.5
4843,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
4844,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
4845,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
4846,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
4847,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
4848,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
4849,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
4850,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
4851,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
4852,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
4853,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
4854,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
4855,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
4856,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
4857,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
4858,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
4859,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
4860,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
4861,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,0.75
4862,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
4863,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
4864,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
4865,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
4866,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
4867,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
4868,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
4869,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
4870,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
4871,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
4872,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
4873,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
4874,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
4875,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
4876,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
4877,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
4878,GPT-5-mini (high),openai/gpt-5-mini,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
4879,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4880,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4881,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4882,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4883,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
4884,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4885,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4886,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4887,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
4888,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
4889,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
4890,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4891,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.5
4892,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4893,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
4894,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
4895,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
4896,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
4897,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
4898,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
4899,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
4900,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
4901,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
4902,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
4903,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
4904,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
4905,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
4906,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
4907,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
4908,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
4909,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
4910,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
4911,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
4912,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
4913,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
4914,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
4915,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
4916,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
4917,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
4918,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
4919,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
4920,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
4921,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
4922,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
4923,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
4924,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
4925,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
4926,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
4927,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
4928,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
4929,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
4930,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
4931,GPT-5 (high),openai/gpt-5,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
4932,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4933,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4934,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4935,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4936,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.75
4937,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4938,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4939,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4940,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
4941,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
4942,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
4943,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4944,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
4945,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4946,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
4947,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
4948,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
4949,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
4950,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
4951,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.75
4952,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
4953,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
4954,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
4955,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
4956,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
4957,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,0.75
4958,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,0.75
4959,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
4960,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
4961,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
4962,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.75
4963,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
4964,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
4965,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
4966,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
4967,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
4968,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
4969,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
4970,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
4971,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
4972,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
4973,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
4974,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,0.75
4975,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
4976,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
4977,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
4978,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
4979,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
4980,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.75
4981,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
4982,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
4983,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
4984,o4-mini (high),openai/o4-mini--high,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
4985,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
4986,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
4987,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
4988,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
4989,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.5
4990,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
4991,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
4992,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
4993,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,0.75
4994,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
4995,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,0.75
4996,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
4997,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
4998,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
4999,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.5
5000,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
5001,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
5002,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
5003,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
5004,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.25
5005,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
5006,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
5007,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
5008,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.5
5009,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
5010,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,0.25
5011,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,0.25
5012,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
5013,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
5014,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
5015,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
5016,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,1.0
5017,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,0.75
5018,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
5019,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
5020,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
5021,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
5022,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
5023,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
5024,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
5025,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
5026,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
5027,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
5028,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,0.75
5029,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
5030,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,1.0
5031,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
5032,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
5033,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.0
5034,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
5035,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
5036,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
5037,GPT OSS 120B (high),openai/oss-20b,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
5038,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
5039,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
5040,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
5041,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
5042,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,0.0
5043,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
5044,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
5045,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
5046,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
5047,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
5048,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,0.5
5049,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
5050,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
5051,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
5052,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,0.75
5053,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
5054,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,0.75
5055,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
5056,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
5057,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
5058,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
5059,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
5060,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
5061,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,0.75
5062,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
5063,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
5064,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
5065,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,0.75
5066,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
5067,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,0.75
5068,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,1.0
5069,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.0
5070,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,0.75
5071,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,1.0
5072,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
5073,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,0.25
5074,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
5075,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
5076,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
5077,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
5078,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
5079,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
5080,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,0.75
5081,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
5082,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
5083,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.0
5084,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,0.75
5085,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,0.75
5086,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.5
5087,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
5088,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
5089,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
5090,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,0.75
5091,Grok 4,xai/grok-4,matharena_smt/smt_2025_1,matharena,matharena,Final Answer Parser,1.0
5092,Grok 4,xai/grok-4,matharena_smt/smt_2025_10,matharena,matharena,Final Answer Parser,1.0
5093,Grok 4,xai/grok-4,matharena_smt/smt_2025_11,matharena,matharena,Final Answer Parser,1.0
5094,Grok 4,xai/grok-4,matharena_smt/smt_2025_12,matharena,matharena,Final Answer Parser,1.0
5095,Grok 4,xai/grok-4,matharena_smt/smt_2025_13,matharena,matharena,Final Answer Parser,1.0
5096,Grok 4,xai/grok-4,matharena_smt/smt_2025_14,matharena,matharena,Final Answer Parser,1.0
5097,Grok 4,xai/grok-4,matharena_smt/smt_2025_15,matharena,matharena,Final Answer Parser,1.0
5098,Grok 4,xai/grok-4,matharena_smt/smt_2025_16,matharena,matharena,Final Answer Parser,1.0
5099,Grok 4,xai/grok-4,matharena_smt/smt_2025_17,matharena,matharena,Final Answer Parser,1.0
5100,Grok 4,xai/grok-4,matharena_smt/smt_2025_18,matharena,matharena,Final Answer Parser,1.0
5101,Grok 4,xai/grok-4,matharena_smt/smt_2025_19,matharena,matharena,Final Answer Parser,1.0
5102,Grok 4,xai/grok-4,matharena_smt/smt_2025_2,matharena,matharena,Final Answer Parser,1.0
5103,Grok 4,xai/grok-4,matharena_smt/smt_2025_20,matharena,matharena,Final Answer Parser,0.0
5104,Grok 4,xai/grok-4,matharena_smt/smt_2025_21,matharena,matharena,Final Answer Parser,1.0
5105,Grok 4,xai/grok-4,matharena_smt/smt_2025_22,matharena,matharena,Final Answer Parser,1.0
5106,Grok 4,xai/grok-4,matharena_smt/smt_2025_23,matharena,matharena,Final Answer Parser,1.0
5107,Grok 4,xai/grok-4,matharena_smt/smt_2025_24,matharena,matharena,Final Answer Parser,1.0
5108,Grok 4,xai/grok-4,matharena_smt/smt_2025_25,matharena,matharena,Final Answer Parser,1.0
5109,Grok 4,xai/grok-4,matharena_smt/smt_2025_26,matharena,matharena,Final Answer Parser,1.0
5110,Grok 4,xai/grok-4,matharena_smt/smt_2025_27,matharena,matharena,Final Answer Parser,0.0
5111,Grok 4,xai/grok-4,matharena_smt/smt_2025_28,matharena,matharena,Final Answer Parser,1.0
5112,Grok 4,xai/grok-4,matharena_smt/smt_2025_29,matharena,matharena,Final Answer Parser,1.0
5113,Grok 4,xai/grok-4,matharena_smt/smt_2025_3,matharena,matharena,Final Answer Parser,1.0
5114,Grok 4,xai/grok-4,matharena_smt/smt_2025_30,matharena,matharena,Final Answer Parser,1.0
5115,Grok 4,xai/grok-4,matharena_smt/smt_2025_31,matharena,matharena,Final Answer Parser,1.0
5116,Grok 4,xai/grok-4,matharena_smt/smt_2025_32,matharena,matharena,Final Answer Parser,1.0
5117,Grok 4,xai/grok-4,matharena_smt/smt_2025_33,matharena,matharena,Final Answer Parser,1.0
5118,Grok 4,xai/grok-4,matharena_smt/smt_2025_34,matharena,matharena,Final Answer Parser,1.0
5119,Grok 4,xai/grok-4,matharena_smt/smt_2025_35,matharena,matharena,Final Answer Parser,1.0
5120,Grok 4,xai/grok-4,matharena_smt/smt_2025_36,matharena,matharena,Final Answer Parser,1.0
5121,Grok 4,xai/grok-4,matharena_smt/smt_2025_37,matharena,matharena,Final Answer Parser,0.75
5122,Grok 4,xai/grok-4,matharena_smt/smt_2025_38,matharena,matharena,Final Answer Parser,0.25
5123,Grok 4,xai/grok-4,matharena_smt/smt_2025_39,matharena,matharena,Final Answer Parser,1.0
5124,Grok 4,xai/grok-4,matharena_smt/smt_2025_4,matharena,matharena,Final Answer Parser,0.75
5125,Grok 4,xai/grok-4,matharena_smt/smt_2025_40,matharena,matharena,Final Answer Parser,1.0
5126,Grok 4,xai/grok-4,matharena_smt/smt_2025_41,matharena,matharena,Final Answer Parser,1.0
5127,Grok 4,xai/grok-4,matharena_smt/smt_2025_42,matharena,matharena,Final Answer Parser,0.0
5128,Grok 4,xai/grok-4,matharena_smt/smt_2025_43,matharena,matharena,Final Answer Parser,0.0
5129,Grok 4,xai/grok-4,matharena_smt/smt_2025_44,matharena,matharena,Final Answer Parser,1.0
5130,Grok 4,xai/grok-4,matharena_smt/smt_2025_45,matharena,matharena,Final Answer Parser,1.0
5131,Grok 4,xai/grok-4,matharena_smt/smt_2025_46,matharena,matharena,Final Answer Parser,1.0
5132,Grok 4,xai/grok-4,matharena_smt/smt_2025_47,matharena,matharena,Final Answer Parser,1.0
5133,Grok 4,xai/grok-4,matharena_smt/smt_2025_48,matharena,matharena,Final Answer Parser,1.0
5134,Grok 4,xai/grok-4,matharena_smt/smt_2025_49,matharena,matharena,Final Answer Parser,1.0
5135,Grok 4,xai/grok-4,matharena_smt/smt_2025_5,matharena,matharena,Final Answer Parser,1.0
5136,Grok 4,xai/grok-4,matharena_smt/smt_2025_50,matharena,matharena,Final Answer Parser,0.75
5137,Grok 4,xai/grok-4,matharena_smt/smt_2025_51,matharena,matharena,Final Answer Parser,1.0
5138,Grok 4,xai/grok-4,matharena_smt/smt_2025_52,matharena,matharena,Final Answer Parser,1.0
5139,Grok 4,xai/grok-4,matharena_smt/smt_2025_53,matharena,matharena,Final Answer Parser,0.0
5140,Grok 4,xai/grok-4,matharena_smt/smt_2025_6,matharena,matharena,Final Answer Parser,1.0
5141,Grok 4,xai/grok-4,matharena_smt/smt_2025_7,matharena,matharena,Final Answer Parser,1.0
5142,Grok 4,xai/grok-4,matharena_smt/smt_2025_8,matharena,matharena,Final Answer Parser,0.0
5143,Grok 4,xai/grok-4,matharena_smt/smt_2025_9,matharena,matharena,Final Answer Parser,1.0
5144,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5145,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5146,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5147,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
5148,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
5149,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5150,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
5151,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5152,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
5153,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5154,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5155,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5156,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5157,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5158,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5159,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5160,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5161,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
5162,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5163,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
5164,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.5
5165,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5166,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5167,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
5168,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5169,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5170,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
5171,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5172,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5173,DeepSeek-v3.1 (Think),deepseek/deepseek_v31,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5174,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5175,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.5
5176,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5177,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
5178,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5179,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5180,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5181,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5182,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,0.75
5183,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5184,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5185,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,0.75
5186,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
5187,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5188,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
5189,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5190,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5191,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5192,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5193,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,0.75
5194,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.5
5195,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
5196,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5197,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5198,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
5199,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.75
5200,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5201,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5202,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
5203,gemini-2.5-pro,gemini/gemini-pro-2.5,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5204,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5205,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
5206,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5207,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.75
5208,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5209,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5210,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5211,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5212,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5213,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5214,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5215,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5216,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
5217,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5218,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
5219,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5220,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5221,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,0.75
5222,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5223,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5224,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.5
5225,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
5226,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5227,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5228,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.25
5229,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.25
5230,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,0.75
5231,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5232,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
5233,o4-mini (high),openai/o4-mini--high,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5234,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5235,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5236,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5237,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
5238,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
5239,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,0.75
5240,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
5241,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5242,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
5243,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5244,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5245,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5246,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5247,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5248,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5249,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5250,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5251,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
5252,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5253,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
5254,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,1.0
5255,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5256,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5257,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
5258,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5259,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5260,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
5261,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,0.75
5262,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5263,GPT-5-mini (high),openai/gpt-5-mini,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5264,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5265,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5266,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5267,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,1.0
5268,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.25
5269,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5270,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
5271,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5272,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.5
5273,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5274,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5275,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5276,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5277,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5278,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5279,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5280,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5281,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.5
5282,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5283,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,1.0
5284,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,1.0
5285,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5286,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5287,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
5288,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5289,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5290,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
5291,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5292,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5293,GPT-5 (high),openai/gpt-5,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5294,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5295,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5296,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,0.75
5297,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
5298,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.75
5299,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5300,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.75
5301,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5302,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
5303,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5304,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5305,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5306,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5307,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5308,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,0.75
5309,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,0.75
5310,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,0.75
5311,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,0.75
5312,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5313,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
5314,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.0
5315,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,0.75
5316,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5317,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.25
5318,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5319,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5320,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
5321,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5322,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5323,GPT OSS 120B (high),openai/oss-20b,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5324,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5325,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.25
5326,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,0.75
5327,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,0.5
5328,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,0.75
5329,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5330,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5331,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5332,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5333,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5334,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5335,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5336,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5337,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5338,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
5339,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.25
5340,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5341,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5342,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5343,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,0.75
5344,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5345,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5346,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5347,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
5348,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5349,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5350,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.0
5351,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,1.0
5352,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5353,Qwen3-235B-A22B,qwen/qwen3_235b_a22b,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5354,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_1,matharena,matharena,Final Answer Parser,1.0
5355,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_10,matharena,matharena,Final Answer Parser,1.0
5356,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_11,matharena,matharena,Final Answer Parser,1.0
5357,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_12,matharena,matharena,Final Answer Parser,0.75
5358,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_13,matharena,matharena,Final Answer Parser,1.0
5359,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_14,matharena,matharena,Final Answer Parser,1.0
5360,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_15,matharena,matharena,Final Answer Parser,1.0
5361,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_16,matharena,matharena,Final Answer Parser,1.0
5362,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_17,matharena,matharena,Final Answer Parser,1.0
5363,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_18,matharena,matharena,Final Answer Parser,1.0
5364,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_19,matharena,matharena,Final Answer Parser,1.0
5365,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_2,matharena,matharena,Final Answer Parser,1.0
5366,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_20,matharena,matharena,Final Answer Parser,1.0
5367,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_21,matharena,matharena,Final Answer Parser,1.0
5368,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_22,matharena,matharena,Final Answer Parser,1.0
5369,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_23,matharena,matharena,Final Answer Parser,1.0
5370,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_24,matharena,matharena,Final Answer Parser,1.0
5371,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_25,matharena,matharena,Final Answer Parser,1.0
5372,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_26,matharena,matharena,Final Answer Parser,1.0
5373,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_27,matharena,matharena,Final Answer Parser,0.75
5374,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_28,matharena,matharena,Final Answer Parser,0.75
5375,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_29,matharena,matharena,Final Answer Parser,1.0
5376,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_3,matharena,matharena,Final Answer Parser,1.0
5377,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_30,matharena,matharena,Final Answer Parser,0.5
5378,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_4,matharena,matharena,Final Answer Parser,1.0
5379,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_5,matharena,matharena,Final Answer Parser,1.0
5380,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_6,matharena,matharena,Final Answer Parser,0.75
5381,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_7,matharena,matharena,Final Answer Parser,1.0
5382,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_8,matharena,matharena,Final Answer Parser,1.0
5383,Grok 4,xai/grok-4,matharena_brumo/brumo_2025_9,matharena,matharena,Final Answer Parser,1.0
5384,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_6,usamo,proofs,OPC R1 8B,0.0
5385,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_2,usamo,proofs,OPC R1 8B,0.0
5386,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_1,usamo,proofs,OPC R1 8B,1.0
5387,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_5,usamo,proofs,OPC R1 8B,0.0
5388,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_3,usamo,proofs,OPC R1 8B,1.0
5389,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usamo_2025_4,usamo,proofs,OPC R1 8B,1.0
5390,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_tst_2025_3,romania,proofs,OPC R1 8B,0.0
5391,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_10_2025_2,romania,proofs,OPC R1 8B,1.0
5392,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_12_2025_2,romania,proofs,OPC R1 8B,1.0
5393,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_12_2025_3,romania,proofs,OPC R1 8B,1.0
5394,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_tst_2025_1,romania,proofs,OPC R1 8B,0.0
5395,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_11_2025_3,romania,proofs,OPC R1 8B,1.0
5396,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_12_2025_1,romania,proofs,OPC R1 8B,1.0
5397,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_tst_2025_2,romania,proofs,OPC R1 8B,1.0
5398,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_11_2025_1,romania,proofs,OPC R1 8B,1.0
5399,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_10_2025_1,romania,proofs,OPC R1 8B,1.0
5400,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_9_2025_2,romania,proofs,OPC R1 8B,0.0
5401,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_9_2025_1,romania,proofs,OPC R1 8B,1.0
5402,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_11_2025_2,romania,proofs,OPC R1 8B,1.0
5403,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,romania_10_2025_3,romania,proofs,OPC R1 8B,1.0
5404,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_7,thai,proofs,OPC R1 8B,0.0
5405,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_6,thai,proofs,OPC R1 8B,1.0
5406,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_9,thai,proofs,OPC R1 8B,1.0
5407,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_2,thai,proofs,OPC R1 8B,1.0
5408,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_10,thai,proofs,OPC R1 8B,1.0
5409,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_8,thai,proofs,OPC R1 8B,1.0
5410,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_1,thai,proofs,OPC R1 8B,1.0
5411,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_5,thai,proofs,OPC R1 8B,1.0
5412,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_3,thai,proofs,OPC R1 8B,1.0
5413,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,thai_2025_4,thai,proofs,OPC R1 8B,1.0
5414,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_6,rmm,proofs,OPC R1 8B,1.0
5415,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_2,rmm,proofs,OPC R1 8B,0.0
5416,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_1,rmm,proofs,OPC R1 8B,1.0
5417,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_5,rmm,proofs,OPC R1 8B,1.0
5418,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_3,rmm,proofs,OPC R1 8B,0.0
5419,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,rmm_2025_4,rmm,proofs,OPC R1 8B,0.0
5420,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_6,egmo,proofs,OPC R1 8B,1.0
5421,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_2,egmo,proofs,OPC R1 8B,1.0
5422,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_1,egmo,proofs,OPC R1 8B,1.0
5423,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_5,egmo,proofs,OPC R1 8B,1.0
5424,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_3,egmo,proofs,OPC R1 8B,0.0
5425,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,egmo_2025_4,egmo,proofs,OPC R1 8B,0.0
5426,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmo_2025_2,bmo,proofs,OPC R1 8B,0.0
5427,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmo_2025_1,bmo,proofs,OPC R1 8B,1.0
5428,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmo_2025_3,bmo,proofs,OPC R1 8B,0.0
5429,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmo_2025_4,bmo,proofs,OPC R1 8B,1.0
5430,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_6,bulgaria,proofs,OPC R1 8B,0.0
5431,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_2,bulgaria,proofs,OPC R1 8B,1.0
5432,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_1,bulgaria,proofs,OPC R1 8B,1.0
5433,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_5,bulgaria,proofs,OPC R1 8B,1.0
5434,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_3,bulgaria,proofs,OPC R1 8B,0.0
5435,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bulgaria_2025_4,bulgaria,proofs,OPC R1 8B,1.0
5436,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_1,elmosl,proofs,OPC R1 8B,0.0
5437,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_6,elmosl,proofs,OPC R1 8B,1.0
5438,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_9,elmosl,proofs,OPC R1 8B,0.0
5439,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_7,elmosl,proofs,OPC R1 8B,0.0
5440,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_5,elmosl,proofs,OPC R1 8B,0.0
5441,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_9,elmosl,proofs,OPC R1 8B,0.0
5442,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_4,elmosl,proofs,OPC R1 8B,1.0
5443,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_6,elmosl,proofs,OPC R1 8B,0.0
5444,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_2,elmosl,proofs,OPC R1 8B,0.0
5445,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_6,elmosl,proofs,OPC R1 8B,0.0
5446,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_2,elmosl,proofs,OPC R1 8B,0.0
5447,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_8,elmosl,proofs,OPC R1 8B,0.0
5448,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_1,elmosl,proofs,OPC R1 8B,0.0
5449,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_7,elmosl,proofs,OPC R1 8B,0.0
5450,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_2,elmosl,proofs,OPC R1 8B,0.0
5451,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_4,elmosl,proofs,OPC R1 8B,0.0
5452,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_1,elmosl,proofs,OPC R1 8B,1.0
5453,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_3,elmosl,proofs,OPC R1 8B,1.0
5454,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_5,elmosl,proofs,OPC R1 8B,1.0
5455,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_5,elmosl,proofs,OPC R1 8B,1.0
5456,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_5,elmosl,proofs,OPC R1 8B,0.0
5457,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_3,elmosl,proofs,OPC R1 8B,1.0
5458,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_7,elmosl,proofs,OPC R1 8B,0.0
5459,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_3,elmosl,proofs,OPC R1 8B,1.0
5460,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_7,elmosl,proofs,OPC R1 8B,0.0
5461,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_C_2025_8,elmosl,proofs,OPC R1 8B,1.0
5462,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_3,elmosl,proofs,OPC R1 8B,1.0
5463,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_NT_2025_1,elmosl,proofs,OPC R1 8B,1.0
5464,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_8,elmosl,proofs,OPC R1 8B,0.0
5465,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_6,elmosl,proofs,OPC R1 8B,1.0
5466,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_A_2025_2,elmosl,proofs,OPC R1 8B,1.0
5467,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,elmosl_G_2025_4,elmosl,proofs,OPC R1 8B,1.0
5468,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_7,usatst,proofs,OPC R1 8B,1.0
5469,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_6,usatst,proofs,OPC R1 8B,1.0
5470,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_9,usatst,proofs,OPC R1 8B,0.0
5471,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_2,usatst,proofs,OPC R1 8B,0.0
5472,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_8,usatst,proofs,OPC R1 8B,0.0
5473,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_1,usatst,proofs,OPC R1 8B,1.0
5474,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_5,usatst,proofs,OPC R1 8B,0.0
5475,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_3,usatst,proofs,OPC R1 8B,0.0
5476,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,usatst_2025_4,usatst,proofs,OPC R1 8B,0.0
5477,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_6,vietnam,proofs,OPC R1 8B,0.0
5478,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_2,vietnam,proofs,OPC R1 8B,1.0
5479,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_1,vietnam,proofs,OPC R1 8B,1.0
5480,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_5,vietnam,proofs,OPC R1 8B,0.0
5481,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_3,vietnam,proofs,OPC R1 8B,0.0
5482,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,vietnam_2025_4,vietnam,proofs,OPC R1 8B,0.0
5483,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_7,allrussian,proofs,OPC R1 8B,0.0
5484,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_6,allrussian,proofs,OPC R1 8B,1.0
5485,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_9,allrussian,proofs,OPC R1 8B,1.0
5486,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_2,allrussian,proofs,OPC R1 8B,1.0
5487,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_12,allrussian,proofs,OPC R1 8B,0.0
5488,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_10,allrussian,proofs,OPC R1 8B,1.0
5489,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_11,allrussian,proofs,OPC R1 8B,0.0
5490,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_8,allrussian,proofs,OPC R1 8B,0.0
5491,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_16,allrussian,proofs,OPC R1 8B,0.0
5492,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_1,allrussian,proofs,OPC R1 8B,0.0
5493,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_15,allrussian,proofs,OPC R1 8B,0.0
5494,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_5,allrussian,proofs,OPC R1 8B,1.0
5495,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_13,allrussian,proofs,OPC R1 8B,1.0
5496,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_3,allrussian,proofs,OPC R1 8B,1.0
5497,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_14,allrussian,proofs,OPC R1 8B,1.0
5498,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,allrussian_2025_4,allrussian,proofs,OPC R1 8B,0.0
5499,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,jbmo_2025_2,jbmo,proofs,OPC R1 8B,0.0
5500,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,jbmo_2025_1,jbmo,proofs,OPC R1 8B,1.0
5501,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,jbmo_2025_3,jbmo,proofs,OPC R1 8B,1.0
5502,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,jbmo_2025_4,jbmo,proofs,OPC R1 8B,0.0
5503,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_6,korea,proofs,OPC R1 8B,0.0
5504,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_2,korea,proofs,OPC R1 8B,0.0
5505,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_1,korea,proofs,OPC R1 8B,1.0
5506,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_5,korea,proofs,OPC R1 8B,1.0
5507,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_3,korea,proofs,OPC R1 8B,0.0
5508,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,korea_2025_4,korea,proofs,OPC R1 8B,0.0
5509,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_6,pan,proofs,OPC R1 8B,1.0
5510,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_2,pan,proofs,OPC R1 8B,1.0
5511,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_3,pan,proofs,OPC R1 8B,1.0
5512,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_5,pan,proofs,OPC R1 8B,1.0
5513,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_1,pan,proofs,OPC R1 8B,1.0
5514,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,pan_african_2025_4,pan,proofs,OPC R1 8B,1.0
5515,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,spain_2025_2,spain,proofs,OPC R1 8B,1.0
5516,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,spain_2025_1,spain,proofs,OPC R1 8B,1.0
5517,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,spain_2025_5,spain,proofs,OPC R1 8B,0.0
5518,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,spain_2025_3,spain,proofs,OPC R1 8B,1.0
5519,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,spain_2025_4,spain,proofs,OPC R1 8B,1.0
5520,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,german_2025_2,german,proofs,OPC R1 8B,0.0
5521,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,german_2025_1,german,proofs,OPC R1 8B,1.0
5522,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,german_2025_3,german,proofs,OPC R1 8B,1.0
5523,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,german_2025_4,german,proofs,OPC R1 8B,0.0
5524,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_6,polish,proofs,OPC R1 8B,0.0
5525,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_2,polish,proofs,OPC R1 8B,1.0
5526,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_1,polish,proofs,OPC R1 8B,1.0
5527,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_5,polish,proofs,OPC R1 8B,0.0
5528,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_3,polish,proofs,OPC R1 8B,1.0
5529,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,polish_2025_4,polish,proofs,OPC R1 8B,1.0
5530,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_7,israel,proofs,OPC R1 8B,0.0
5531,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_3,israel,proofs,OPC R1 8B,0.0
5532,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_5,israel,proofs,OPC R1 8B,0.0
5533,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_4,israel,proofs,OPC R1 8B,0.0
5534,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_6,israel,proofs,OPC R1 8B,0.0
5535,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_1,israel,proofs,OPC R1 8B,1.0
5536,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_10,israel,proofs,OPC R1 8B,0.0
5537,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_2,israel,proofs,OPC R1 8B,0.0
5538,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_8,israel,proofs,OPC R1 8B,0.0
5539,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,israel_tst_2025_9,israel,proofs,OPC R1 8B,0.0
5540,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_7,imosl,proofs,OPC R1 8B,0.0
5541,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_35,imosl,proofs,OPC R1 8B,0.0
5542,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_6,imosl,proofs,OPC R1 8B,0.0
5543,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_9,imosl,proofs,OPC R1 8B,0.0
5544,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_2,imosl,proofs,OPC R1 8B,1.0
5545,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_12,imosl,proofs,OPC R1 8B,1.0
5546,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_25,imosl,proofs,OPC R1 8B,0.0
5547,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_33,imosl,proofs,OPC R1 8B,0.0
5548,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_23,imosl,proofs,OPC R1 8B,0.0
5549,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_31,imosl,proofs,OPC R1 8B,1.0
5550,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_24,imosl,proofs,OPC R1 8B,0.0
5551,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_37,imosl,proofs,OPC R1 8B,0.0
5552,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_10,imosl,proofs,OPC R1 8B,0.0
5553,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_11,imosl,proofs,OPC R1 8B,0.0
5554,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_30,imosl,proofs,OPC R1 8B,0.0
5555,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_17,imosl,proofs,OPC R1 8B,1.0
5556,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_8,imosl,proofs,OPC R1 8B,0.0
5557,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_32,imosl,proofs,OPC R1 8B,1.0
5558,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_16,imosl,proofs,OPC R1 8B,1.0
5559,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_34,imosl,proofs,OPC R1 8B,0.0
5560,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_19,imosl,proofs,OPC R1 8B,0.0
5561,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_20,imosl,proofs,OPC R1 8B,0.0
5562,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_22,imosl,proofs,OPC R1 8B,0.0
5563,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_36,imosl,proofs,OPC R1 8B,0.0
5564,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_1,imosl,proofs,OPC R1 8B,1.0
5565,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_28,imosl,proofs,OPC R1 8B,0.0
5566,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_15,imosl,proofs,OPC R1 8B,0.0
5567,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_18,imosl,proofs,OPC R1 8B,0.0
5568,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_27,imosl,proofs,OPC R1 8B,1.0
5569,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_21,imosl,proofs,OPC R1 8B,0.0
5570,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_5,imosl,proofs,OPC R1 8B,0.0
5571,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_13,imosl,proofs,OPC R1 8B,1.0
5572,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_3,imosl,proofs,OPC R1 8B,1.0
5573,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_29,imosl,proofs,OPC R1 8B,0.0
5574,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_14,imosl,proofs,OPC R1 8B,0.0
5575,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_26,imosl,proofs,OPC R1 8B,0.0
5576,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,imosl_2025_4,imosl,proofs,OPC R1 8B,0.0
5577,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_13,matharena,answer,Final Answer Parser,1.0
5578,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_9,matharena,answer,Final Answer Parser,1.0
5579,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_40,matharena,answer,Final Answer Parser,1.0
5580,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_14,matharena,answer,Final Answer Parser,1.0
5581,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_15,matharena,answer,Final Answer Parser,1.0
5582,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_10,matharena,answer,Final Answer Parser,1.0
5583,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_5,matharena,answer,Final Answer Parser,1.0
5584,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_17,matharena,answer,Final Answer Parser,1.0
5585,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_7,matharena,answer,Final Answer Parser,1.0
5586,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_12,matharena,answer,Final Answer Parser,1.0
5587,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_32,matharena,answer,Final Answer Parser,1.0
5588,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_16,matharena,answer,Final Answer Parser,1.0
5589,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_40,matharena,answer,Final Answer Parser,1.0
5590,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_12,matharena,answer,Final Answer Parser,1.0
5591,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_15,matharena,answer,Final Answer Parser,1.0
5592,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_32,matharena,answer,Final Answer Parser,0.0
5593,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_24,matharena,answer,Final Answer Parser,1.0
5594,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_2,matharena,answer,Final Answer Parser,1.0
5595,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_6,matharena,answer,Final Answer Parser,1.0
5596,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_22,matharena,answer,Final Answer Parser,1.0
5597,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_27,matharena,answer,Final Answer Parser,1.0
5598,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_36,matharena,answer,Final Answer Parser,1.0
5599,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_18,matharena,answer,Final Answer Parser,1.0
5600,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_11,matharena,answer,Final Answer Parser,1.0
5601,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_18,matharena,answer,Final Answer Parser,1.0
5602,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_9,matharena,answer,Final Answer Parser,1.0
5603,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_14,matharena,answer,Final Answer Parser,0.0
5604,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_27,matharena,answer,Final Answer Parser,1.0
5605,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_24,matharena,answer,Final Answer Parser,1.0
5606,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_37,matharena,answer,Final Answer Parser,1.0
5607,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_2,matharena,answer,Final Answer Parser,1.0
5608,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_52,matharena,answer,Final Answer Parser,1.0
5609,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_17,matharena,answer,Final Answer Parser,1.0
5610,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_19,matharena,answer,Final Answer Parser,1.0
5611,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_25,matharena,answer,Final Answer Parser,1.0
5612,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_4,matharena,answer,Final Answer Parser,1.0
5613,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_21,matharena,answer,Final Answer Parser,1.0
5614,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_34,matharena,answer,Final Answer Parser,1.0
5615,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_13,matharena,answer,Final Answer Parser,1.0
5616,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_47,matharena,answer,Final Answer Parser,1.0
5617,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_11,matharena,answer,Final Answer Parser,1.0
5618,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_41,matharena,answer,Final Answer Parser,1.0
5619,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_6,matharena,answer,Final Answer Parser,1.0
5620,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_34,matharena,answer,Final Answer Parser,1.0
5621,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_22,matharena,answer,Final Answer Parser,1.0
5622,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_33,matharena,answer,Final Answer Parser,1.0
5623,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_17,matharena,answer,Final Answer Parser,1.0
5624,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_30,matharena,answer,Final Answer Parser,1.0
5625,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_19,matharena,answer,Final Answer Parser,1.0
5626,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_10,matharena,answer,Final Answer Parser,1.0
5627,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_20,matharena,answer,Final Answer Parser,0.0
5628,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_4,matharena,answer,Final Answer Parser,1.0
5629,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_7,matharena,answer,Final Answer Parser,0.0
5630,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_21,matharena,answer,Final Answer Parser,1.0
5631,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_37,matharena,answer,Final Answer Parser,1.0
5632,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_14,matharena,answer,Final Answer Parser,1.0
5633,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_29,matharena,answer,Final Answer Parser,1.0
5634,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_23,matharena,answer,Final Answer Parser,1.0
5635,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_21,matharena,answer,Final Answer Parser,1.0
5636,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_23,matharena,answer,Final Answer Parser,1.0
5637,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_17,matharena,answer,Final Answer Parser,1.0
5638,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_29,matharena,answer,Final Answer Parser,0.0
5639,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_19,matharena,answer,Final Answer Parser,1.0
5640,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_2,matharena,answer,Final Answer Parser,1.0
5641,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_3,matharena,answer,Final Answer Parser,1.0
5642,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_11,matharena,answer,Final Answer Parser,1.0
5643,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_6,matharena,answer,Final Answer Parser,1.0
5644,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_9,matharena,answer,Final Answer Parser,1.0
5645,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_33,matharena,answer,Final Answer Parser,1.0
5646,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_8,matharena,answer,Final Answer Parser,1.0
5647,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_5,matharena,answer,Final Answer Parser,1.0
5648,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_17,matharena,answer,Final Answer Parser,1.0
5649,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_24,matharena,answer,Final Answer Parser,1.0
5650,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_9,matharena,answer,Final Answer Parser,1.0
5651,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_23,matharena,answer,Final Answer Parser,1.0
5652,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_28,matharena,answer,Final Answer Parser,1.0
5653,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_49,matharena,answer,Final Answer Parser,1.0
5654,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_30,matharena,answer,Final Answer Parser,1.0
5655,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_12,matharena,answer,Final Answer Parser,1.0
5656,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_35,matharena,answer,Final Answer Parser,1.0
5657,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_22,matharena,answer,Final Answer Parser,1.0
5658,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_4,matharena,answer,Final Answer Parser,1.0
5659,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_29,matharena,answer,Final Answer Parser,1.0
5660,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_42,matharena,answer,Final Answer Parser,0.0
5661,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_26,matharena,answer,Final Answer Parser,1.0
5662,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_5,matharena,answer,Final Answer Parser,1.0
5663,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_2,matharena,answer,Final Answer Parser,1.0
5664,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_44,matharena,answer,Final Answer Parser,1.0
5665,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_19,matharena,answer,Final Answer Parser,1.0
5666,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_23,matharena,answer,Final Answer Parser,1.0
5667,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_31,matharena,answer,Final Answer Parser,1.0
5668,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_6,matharena,answer,Final Answer Parser,1.0
5669,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_3,matharena,answer,Final Answer Parser,1.0
5670,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_16,matharena,answer,Final Answer Parser,1.0
5671,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_3,matharena,answer,Final Answer Parser,1.0
5672,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_10,matharena,answer,Final Answer Parser,1.0
5673,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_3,matharena,answer,Final Answer Parser,1.0
5674,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_27,matharena,answer,Final Answer Parser,1.0
5675,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_27,matharena,answer,Final Answer Parser,1.0
5676,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_5,matharena,answer,Final Answer Parser,1.0
5677,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_23,matharena,answer,Final Answer Parser,0.0
5678,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_20,matharena,answer,Final Answer Parser,1.0
5679,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_43,matharena,answer,Final Answer Parser,1.0
5680,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_12,matharena,answer,Final Answer Parser,1.0
5681,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_13,matharena,answer,Final Answer Parser,1.0
5682,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_19,matharena,answer,Final Answer Parser,1.0
5683,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_15,matharena,answer,Final Answer Parser,0.0
5684,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_21,matharena,answer,Final Answer Parser,1.0
5685,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_39,matharena,answer,Final Answer Parser,1.0
5686,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_11,matharena,answer,Final Answer Parser,1.0
5687,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_29,matharena,answer,Final Answer Parser,1.0
5688,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_20,matharena,answer,Final Answer Parser,1.0
5689,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_10,matharena,answer,Final Answer Parser,1.0
5690,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_7,matharena,answer,Final Answer Parser,1.0
5691,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_7,matharena,answer,Final Answer Parser,1.0
5692,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_8,matharena,answer,Final Answer Parser,1.0
5693,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_30,matharena,answer,Final Answer Parser,1.0
5694,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_51,matharena,answer,Final Answer Parser,1.0
5695,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_26,matharena,answer,Final Answer Parser,1.0
5696,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_15,matharena,answer,Final Answer Parser,1.0
5697,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_13,matharena,answer,Final Answer Parser,1.0
5698,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_16,matharena,answer,Final Answer Parser,1.0
5699,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_20,matharena,answer,Final Answer Parser,0.0
5700,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_35,matharena,answer,Final Answer Parser,1.0
5701,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_10,matharena,answer,Final Answer Parser,1.0
5702,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_22,matharena,answer,Final Answer Parser,1.0
5703,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_8,matharena,answer,Final Answer Parser,1.0
5704,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_6,matharena,answer,Final Answer Parser,1.0
5705,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_18,matharena,answer,Final Answer Parser,1.0
5706,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_1,matharena,answer,Final Answer Parser,1.0
5707,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_16,matharena,answer,Final Answer Parser,1.0
5708,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_31,matharena,answer,Final Answer Parser,1.0
5709,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_1,matharena,answer,Final Answer Parser,1.0
5710,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_50,matharena,answer,Final Answer Parser,1.0
5711,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_28,matharena,answer,Final Answer Parser,0.0
5712,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_4,matharena,answer,Final Answer Parser,1.0
5713,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_29,matharena,answer,Final Answer Parser,1.0
5714,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_8,matharena,answer,Final Answer Parser,1.0
5715,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_26,matharena,answer,Final Answer Parser,1.0
5716,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_24,matharena,answer,Final Answer Parser,1.0
5717,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_36,matharena,answer,Final Answer Parser,1.0
5718,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_1,matharena,answer,Final Answer Parser,1.0
5719,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_20,matharena,answer,Final Answer Parser,1.0
5720,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_21,matharena,answer,Final Answer Parser,1.0
5721,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_25,matharena,answer,Final Answer Parser,1.0
5722,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_30,matharena,answer,Final Answer Parser,1.0
5723,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_28,matharena,answer,Final Answer Parser,1.0
5724,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_1,matharena,answer,Final Answer Parser,1.0
5725,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_14,matharena,answer,Final Answer Parser,1.0
5726,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_1,matharena,answer,Final Answer Parser,1.0
5727,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_2,matharena,answer,Final Answer Parser,1.0
5728,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_45,matharena,answer,Final Answer Parser,1.0
5729,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_25,matharena,answer,Final Answer Parser,1.0
5730,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_28,matharena,answer,Final Answer Parser,1.0
5731,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_18,matharena,answer,Final Answer Parser,1.0
5732,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_22,matharena,answer,Final Answer Parser,1.0
5733,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_15,matharena,answer,Final Answer Parser,1.0
5734,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_4,matharena,answer,Final Answer Parser,1.0
5735,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_48,matharena,answer,Final Answer Parser,1.0
5736,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_46,matharena,answer,Final Answer Parser,1.0
5737,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_12,matharena,answer,Final Answer Parser,1.0
5738,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_3,matharena,answer,Final Answer Parser,1.0
5739,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_26,matharena,answer,Final Answer Parser,1.0
5740,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_aime/aime_2025_13,matharena,answer,Final Answer Parser,1.0
5741,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_24,matharena,answer,Final Answer Parser,1.0
5742,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_27,matharena,answer,Final Answer Parser,1.0
5743,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_53,matharena,answer,Final Answer Parser,1.0
5744,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_7,matharena,answer,Final Answer Parser,1.0
5745,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_38,matharena,answer,Final Answer Parser,1.0
5746,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_25,matharena,answer,Final Answer Parser,1.0
5747,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_38,matharena,answer,Final Answer Parser,1.0
5748,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_39,matharena,answer,Final Answer Parser,1.0
5749,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_11,matharena,answer,Final Answer Parser,1.0
5750,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_25,matharena,answer,Final Answer Parser,1.0
5751,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_8,matharena,answer,Final Answer Parser,1.0
5752,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_18,matharena,answer,Final Answer Parser,1.0
5753,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_5,matharena,answer,Final Answer Parser,1.0
5754,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_26,matharena,answer,Final Answer Parser,1.0
5755,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_hmmt/hmmt_feb_2025_30,matharena,answer,Final Answer Parser,0.0
5756,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_16,matharena,answer,Final Answer Parser,1.0
5757,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_brumo/brumo_2025_28,matharena,answer,Final Answer Parser,1.0
5758,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_cmimc/cmimc_2025_9,matharena,answer,Final Answer Parser,1.0
5759,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,matharena_smt/smt_2025_14,matharena,answer,Final Answer Parser,1.0
5760,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_1,bmosl,proofs,OPC R1 8B,1.0
5761,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_6,bmosl,proofs,OPC R1 8B,1.0
5762,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_5,bmosl,proofs,OPC R1 8B,0.0
5763,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_4,bmosl,proofs,OPC R1 8B,0.0
5764,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_6,bmosl,proofs,OPC R1 8B,1.0
5765,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_2,bmosl,proofs,OPC R1 8B,1.0
5766,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_6,bmosl,proofs,OPC R1 8B,0.0
5767,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_2,bmosl,proofs,OPC R1 8B,0.0
5768,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_1,bmosl,proofs,OPC R1 8B,1.0
5769,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_7,bmosl,proofs,OPC R1 8B,0.0
5770,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_2,bmosl,proofs,OPC R1 8B,1.0
5771,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_4,bmosl,proofs,OPC R1 8B,0.0
5772,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_1,bmosl,proofs,OPC R1 8B,1.0
5773,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_3,bmosl,proofs,OPC R1 8B,1.0
5774,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_5,bmosl,proofs,OPC R1 8B,1.0
5775,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_5,bmosl,proofs,OPC R1 8B,0.0
5776,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_5,bmosl,proofs,OPC R1 8B,0.0
5777,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_4,bmosl,proofs,OPC R1 8B,0.0
5778,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_C_2025_3,bmosl,proofs,OPC R1 8B,1.0
5779,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_3,bmosl,proofs,OPC R1 8B,0.0
5780,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_7,bmosl,proofs,OPC R1 8B,1.0
5781,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_3,bmosl,proofs,OPC R1 8B,0.0
5782,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_NT_2025_1,bmosl,proofs,OPC R1 8B,0.0
5783,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_6,bmosl,proofs,OPC R1 8B,1.0
5784,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_A_2025_2,bmosl,proofs,OPC R1 8B,1.0
5785,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,bmosl_G_2025_4,bmosl,proofs,OPC R1 8B,0.0
5786,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_10,india,proofs,OPC R1 8B,0.0
5787,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_15,india,proofs,OPC R1 8B,0.0
5788,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_14,india,proofs,OPC R1 8B,1.0
5789,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_19,india,proofs,OPC R1 8B,0.0
5790,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_7,india,proofs,OPC R1 8B,0.0
5791,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_6,india,proofs,OPC R1 8B,0.0
5792,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_2,india,proofs,OPC R1 8B,0.0
5793,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_2,india,proofs,OPC R1 8B,0.0
5794,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_5,india,proofs,OPC R1 8B,0.0
5795,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_12,india,proofs,OPC R1 8B,1.0
5796,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_17,india,proofs,OPC R1 8B,1.0
5797,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_6,india,proofs,OPC R1 8B,0.0
5798,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_4,india,proofs,OPC R1 8B,1.0
5799,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_9,india,proofs,OPC R1 8B,1.0
5800,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_20,india,proofs,OPC R1 8B,0.0
5801,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_8,india,proofs,OPC R1 8B,0.0
5802,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_18,india,proofs,OPC R1 8B,0.0
5803,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_1,india,proofs,OPC R1 8B,1.0
5804,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_1,india,proofs,OPC R1 8B,1.0
5805,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_11,india,proofs,OPC R1 8B,0.0
5806,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_5,india,proofs,OPC R1 8B,0.0
5807,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_3,india,proofs,OPC R1 8B,0.0
5808,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_3,india,proofs,OPC R1 8B,0.0
5809,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_21,india,proofs,OPC R1 8B,0.0
5810,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_13,india,proofs,OPC R1 8B,1.0
5811,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_prep_2025_16,india,proofs,OPC R1 8B,1.0
5812,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,india_2025_4,india,proofs,OPC R1 8B,1.0
5813,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_6,izho,proofs,OPC R1 8B,0.0
5814,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_2,izho,proofs,OPC R1 8B,1.0
5815,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_1,izho,proofs,OPC R1 8B,1.0
5816,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_5,izho,proofs,OPC R1 8B,0.0
5817,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_3,izho,proofs,OPC R1 8B,1.0
5818,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,izho_2025_4,izho,proofs,OPC R1 8B,1.0
5819,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,canada_2025_2,canada,proofs,OPC R1 8B,1.0
5820,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,canada_2025_1,canada,proofs,OPC R1 8B,0.0
5821,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,canada_2025_5,canada,proofs,OPC R1 8B,1.0
5822,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,canada_2025_3,canada,proofs,OPC R1 8B,1.0
5823,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,canada_2025_4,canada,proofs,OPC R1 8B,0.0
5824,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,greece_2025_2,greece,proofs,OPC R1 8B,1.0
5825,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,greece_2025_1,greece,proofs,OPC R1 8B,1.0
5826,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,greece_2025_3,greece,proofs,OPC R1 8B,1.0
5827,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,greece_2025_4,greece,proofs,OPC R1 8B,1.0
5828,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_7,turkey,proofs,OPC R1 8B,0.0
5829,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_3,turkey,proofs,OPC R1 8B,0.0
5830,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_5,turkey,proofs,OPC R1 8B,0.0
5831,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_4,turkey,proofs,OPC R1 8B,0.0
5832,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_6,turkey,proofs,OPC R1 8B,0.0
5833,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_1,turkey,proofs,OPC R1 8B,1.0
5834,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_2,turkey,proofs,OPC R1 8B,1.0
5835,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_8,turkey,proofs,OPC R1 8B,0.0
5836,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,turkey_tst_2025_9,turkey,proofs,OPC R1 8B,0.0
5837,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,nordic_2025_2,nordic,proofs,OPC R1 8B,1.0
5838,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,nordic_2025_1,nordic,proofs,OPC R1 8B,1.0
5839,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,nordic_2025_3,nordic,proofs,OPC R1 8B,1.0
5840,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,china_2025_6,china,proofs,OPC R1 8B,0.0
5841,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,china_2025_2,china,proofs,OPC R1 8B,0.0
5842,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,china_2025_1,china,proofs,OPC R1 8B,1.0
5843,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,china_2025_5,china,proofs,OPC R1 8B,0.0
5844,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,china_2025_3,china,proofs,OPC R1 8B,0.0
5845,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_7,chinatst,proofs,OPC R1 8B,1.0
5846,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_6,chinatst,proofs,OPC R1 8B,1.0
5847,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_9,chinatst,proofs,OPC R1 8B,0.0
5848,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_2,chinatst,proofs,OPC R1 8B,0.0
5849,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_12,chinatst,proofs,OPC R1 8B,1.0
5850,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_10,chinatst,proofs,OPC R1 8B,0.0
5851,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_11,chinatst,proofs,OPC R1 8B,0.0
5852,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_17,chinatst,proofs,OPC R1 8B,0.0
5853,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_8,chinatst,proofs,OPC R1 8B,0.0
5854,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_16,chinatst,proofs,OPC R1 8B,0.0
5855,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_19,chinatst,proofs,OPC R1 8B,0.0
5856,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_20,chinatst,proofs,OPC R1 8B,0.0
5857,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_22,chinatst,proofs,OPC R1 8B,0.0
5858,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_1,chinatst,proofs,OPC R1 8B,1.0
5859,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_15,chinatst,proofs,OPC R1 8B,1.0
5860,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_18,chinatst,proofs,OPC R1 8B,0.0
5861,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_21,chinatst,proofs,OPC R1 8B,1.0
5862,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_5,chinatst,proofs,OPC R1 8B,0.0
5863,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_13,chinatst,proofs,OPC R1 8B,0.0
5864,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_3,chinatst,proofs,OPC R1 8B,0.0
5865,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_14,chinatst,proofs,OPC R1 8B,1.0
5866,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,chinatst_2025_4,chinatst,proofs,OPC R1 8B,1.0
5867,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,serbia_tst_bmo_2025_2,serbia,proofs,OPC R1 8B,0.0
5868,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,serbia_tst_bmo_2025_3,serbia,proofs,OPC R1 8B,1.0
5869,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,serbia_tst_bmo_2025_1,serbia,proofs,OPC R1 8B,1.0
5870,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,serbia_tst_bmo_2025_4,serbia,proofs,OPC R1 8B,0.0
5871,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_7,iran,proofs,OPC R1 8B,1.0
5872,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_3,iran,proofs,OPC R1 8B,0.0
5873,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_5,iran,proofs,OPC R1 8B,0.0
5874,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_4,iran,proofs,OPC R1 8B,1.0
5875,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_6,iran,proofs,OPC R1 8B,0.0
5876,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_1,iran,proofs,OPC R1 8B,0.0
5877,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_2,iran,proofs,OPC R1 8B,1.0
5878,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_8,iran,proofs,OPC R1 8B,0.0
5879,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,iran_tst_2025_9,iran,proofs,OPC R1 8B,1.0
5880,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_7,philippines,proofs,OPC R1 8B,1.0
5881,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_6,philippines,proofs,OPC R1 8B,1.0
5882,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_2,philippines,proofs,OPC R1 8B,0.0
5883,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_8,philippines,proofs,OPC R1 8B,0.0
5884,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_1,philippines,proofs,OPC R1 8B,1.0
5885,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_5,philippines,proofs,OPC R1 8B,1.0
5886,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_3,philippines,proofs,OPC R1 8B,1.0
5887,Gemini Pro 3 Preview,gemini/gemini-pro-3-preview,philippines_2025_4,philippines,proofs,OPC R1 8B,0.0
