Step,GRPO-Qwen2.5-math-7b-math - response_length/mean
1,991.5819702
2,949.9343872
3,917.4456177
4,849.2210083
5,781.234314
6,724.4401855
7,705.1735229
8,678.3019409
9,664.0440674
10,660.7515869
11,655.6636963
12,643.5480957
13,653.3731689
14,638.2384033
15,635.1629028
16,644.4938965
17,644.9567261
18,638.571106
19,633.2724609
20,646.0713501
21,618.8389282
22,615.8848267
23,617.1369019
24,614.7074585
25,612.4813232
26,636.7709961
27,614.7074585
28,644.7974243
29,635.8817749
30,639.8334961
31,631.6362305
32,637.9077759
33,639.668335
34,626.7819214
35,630.7491455
36,654.3745728
37,639.7384033
38,621.1446533
39,628.8532715
40,639.0414429
41,632.0765991
42,631.1132813
43,625.4914551
44,619.4537354
45,631.4252319
46,633.7897339
47,619.7453613
48,632.0925903
49,628.4858398
50,628.3568726
51,630.3144531
52,621.5449829
53,649.1175537
54,630.7145996
55,649.0249634
56,623.5426025
57,626.1973877
58,634.2229614
59,636.5403442
60,637.7223511
61,631.1018066
62,638.9943237
63,642.1618652
64,624.6462402
65,637.22052
66,619.4008179
67,621.9338379
68,619.9371338
69,653.006897
70,644.1104736
71,633.8881226
72,617.2404785
73,640.324585
74,621.1467896
75,621.9279785
76,640.0402222
77,646.9697266
78,650.1046753
79,621.0848389
80,626.7546387
81,617.6220703
82,607.2797852
83,625.7334595
84,611.739563
85,643.9490967
86,646.4887085
87,614.6621094
88,645.9016113
89,621.2492676
90,639.4799194
91,634.4927368
92,633.460144
93,610.7163086
94,614.4602661
95,620.0670776
96,636.2266846
97,616.1008301
98,635.3285522
99,603.3519287
100,616.4567871
101,623.3997192
102,639.4632568
103,630.7506714
104,629.647644
105,608.3625488
106,631.8171997
107,615.5597534
108,623.194458
109,631.6757202
110,608.3056641
111,616.3609619
112,628.1451416
113,623.0371094
114,617.0662842
115,605.6416626
116,617.3448486
117,622.9141235
118,613.5479736
119,620.5796509
120,613.088623
121,623.1877441
122,610.9520874
123,611.2958984
124,621.4353027
125,605.6774902
126,592.6160278
127,598.1504517
128,626.1226807
129,616.7356567
130,623.6588135
131,616.7879028
132,623.1381226
133,619.5656738
134,612.2159424
135,624.041748
136,604.8363037
137,629.8512573
138,632.1730347
139,611.3683472
140,621.8687134
141,624.399292
142,628.6776733
143,610.2142944
144,622.5049438
145,614.4033203
146,644.1848145
147,612.6724243
148,614.4124146
149,618.1450195
150,623.0491943
151,625.3064575
152,609.6743164
153,629.5596313
154,616.4800415
155,603.2509766
156,628.1335449
157,626.5060425
158,622.8169556
159,623.0704956
160,627.3109131
161,625.4833984
162,640.730835
163,620.2034302
164,631.8535767
165,632.6152954
166,629.7210083
167,636.3477783
168,610.2914429
169,617.6062622
170,636.5406494
171,634.8349609
172,629.7228394
173,619.2756348
174,619.5497437
175,626.7612305
176,625.7133789
177,622.0686646
178,617.0241089
179,619.2231445
180,631.6993408
181,622.8699341
182,628.2519531
183,625.8032837
184,624.0964966
185,645.1741333
186,620.1694946
187,612.46698
188,627.9989624
189,653.2272949
190,610.4472656
191,619.9860229
192,606.4709473
193,617.6062622
194,636.5406494
195,634.8349609
196,629.7228394
197,619.2756348
198,619.5497437
199,626.7612305
200,625.7133789
201,622.0686646
202,617.0241089
203,619.2231445
204,631.6993408
205,622.8699341
206,628.2519531
207,625.8032837
208,624.0964966
209,645.1741333
210,620.1694946
211,612.46698
212,627.9989624
213,620.2034302
214,631.8535767
215,632.6152954
216,629.7210083
217,636.3477783
218,610.2914429
219,606.4709473