Step,UCAS-Qwen2.5-math-7b-math_adaptive - actor/entropy
1,0.311713535
2,0.300570616
3,0.282090244
4,0.259782137
5,0.229327576
6,0.190502746
7,0.17639148
8,0.156251657
9,0.123858687
10,0.116251903
11,0.114651667
12,0.114812384
13,0.114755662
14,0.118127289
15,0.11346663
16,0.115350904
17,0.117797191
18,0.105729252
19,0.106785379
20,0.106501505
21,0.107950285
22,0.109348528
23,0.111315802
24,0.108038716
25,0.108399622
26,0.11231672
27,0.112649381
28,0.111206159
29,0.10959857
30,0.109507158
31,0.111082166
32,0.110067047
33,0.106736086
34,0.109862767
35,0.111328863
36,0.110718973
37,0.109029189
38,0.110011712
39,0.110042177
40,0.114780053
41,0.111579642
42,0.110331289
43,0.108704336
44,0.112530209
45,0.114266239
46,0.110055983
47,0.111051075
48,0.112960376
49,0.11242386
50,0.116592892
51,0.110869527
52,0.118256494
53,0.111674309
54,0.110089079
55,0.118401252
56,0.117497377
57,0.117278725
58,0.116477907
59,0.119276367
60,0.117624193
61,0.120729677
62,0.120802708
63,0.121075518
64,0.122463681
65,0.126091182
66,0.126887143
67,0.124553524
68,0.123090982
69,0.127089888
70,0.120970851
71,0.118768519
72,0.120259112
73,0.122188603
74,0.122453695
75,0.125524541
76,0.120262241
77,0.125468647
78,0.124165972
79,0.129037058
80,0.127734647
81,0.126692698
82,0.121635616
83,0.125732557
84,0.127735884
85,0.133332715
86,0.142330453
87,0.138692245
88,0.140073345
89,0.134601445
90,0.140331194
91,0.144157604
92,0.147496984
93,0.145935983
94,0.148015544
95,0.140855879
96,0.144329906
97,0.146171228
98,0.156293586
99,0.15686065
100,0.150819019
101,0.14671889
102,0.16387798
103,0.151569024
104,0.155832321
105,0.159117342
106,0.156471179
107,0.162879065
108,0.160175443
109,0.166053936
110,0.160910369
111,0.174654872
112,0.162877545
113,0.166559136
114,0.166016162
115,0.16662176
116,0.169741622
117,0.169334129
118,0.170568237
119,0.168153805
120,0.175971956
121,0.175552795
122,0.178817974
123,0.18384152
124,0.185781441
125,0.190061581
126,0.179514224
127,0.176918099
128,0.192044477
129,0.191764424
130,0.186757634
131,0.191803465
132,0.188868354
133,0.186029966
134,0.19604827
135,0.188420738
136,0.192767615
137,0.206613178
138,0.194764192
139,0.186514656
140,0.208530734
141,0.185003365
142,0.202994401
143,0.193236123
144,0.19656604
145,0.203541259
146,0.200636993
147,0.200225289
148,0.206129412
149,0.204285736
150,0.203335772
151,0.212286308
152,0.209865332
153,0.226023286
154,0.201114133
155,0.205821037
156,0.211214825
157,0.206508815
158,0.212201938
159,0.208820403
160,0.209964117
161,0.212873166
162,0.199498912
163,0.224889015
164,0.214790171
165,0.212759992
166,0.200993171
167,0.208643948
168,0.209962224
169,0.206712534
170,0.218020087
171,0.206085598
172,0.222222631
173,0.19568575
174,0.204840084
175,0.203064164
176,0.208410477
177,0.212706035
178,0.201962238
179,0.193656867
180,0.220729595
181,0.192726304
182,0.20672447
183,0.206821283
184,0.202500557
185,0.208465596
186,0.213230868
187,0.20907334
188,0.213018855
189,0.212481266
190,0.203127047
191,0.208170121
192,0.219824558
193,0.216533428
194,0.204748278
195,0.19410729
196,0.198729585
197,0.188839714
198,0.196143623
199,0.204753439
200,0.210761036
201,0.195953067
202,0.197960253
203,0.198786895
204,0.190831746
205,0.194434013
206,0.189792375
207,0.1875672
208,0.195123162
209,0.189167704
210,0.203615169
211,0.206955891
212,0.19459642
213,0.196780305
214,0.193027805
215,0.197250034
216,0.20349599
217,0.195459049
218,0.194127466
219,0.186540123
220,0.207762729
221,0.195125441
222,0.192381407
223,0.190427642
224,0.1866385
225,0.207100611
226,0.198641013
227,0.195747163
228,0.204878728
229,0.200153779
230,0.20003302
231,0.197411145
232,0.207637648
233,0.193477149
234,0.186264168
235,0.183865558
236,0.18367147
237,0.195575829
238,0.194384496
239,0.196639161
240,0.18559977
241,0.196396987