Step,UCAS-Qwen2.5-math-1.5b-math_adaptive_v5 - actor/entropy
1,0.431873798
2,0.452916265
3,0.397866279
4,0.338076472
5,0.266935021
6,0.202143759
7,0.18220076
8,0.162807301
9,0.140723646
10,0.137065455
11,0.127464607
12,0.128336132
13,0.12722367
14,0.121775702
15,0.119282492
16,0.125946969
17,0.119374976
18,0.121146418
19,0.121797256
20,0.11733868
21,0.118980467
22,0.117709167
23,0.118120968
24,0.117869742
25,0.117635399
26,0.116655059
27,0.116391182
28,0.119018532
29,0.115871146
30,0.113239467
31,0.112578288
32,0.115133144
33,0.114335954
34,0.111595653
35,0.108293556
36,0.107967652
37,0.110038228
38,0.105603173
39,0.109131508
40,0.109043345
41,0.102511778
42,0.107470319
43,0.104334466
44,0.100963503
45,0.099771157
46,0.100526862
47,0.098962739
48,0.101454705
49,0.099243268
50,0.097878516
51,0.097425684
52,0.095763877
53,0.097002931
54,0.094862357
55,0.096885435
56,0.094121926
57,0.096120872
58,0.094877757
59,0.093742125
60,0.089500882
61,0.090903893
62,0.088622175
63,0.08953882
64,0.089219816
65,0.085062005
66,0.087194085
67,0.083807342
68,0.085533097
69,0.087625511
70,0.08475697
71,0.08512792
72,0.083713442
73,0.083312117
74,0.084757887
75,0.08249595
76,0.082547687
77,0.082780115
78,0.081860989
79,0.081555463
80,0.084345467
81,0.082561456
82,0.08381328
83,0.082382433
84,0.080843791
85,0.081823334
86,0.078574695
87,0.081998251
88,0.080915548
89,0.081304751
90,0.081591517
91,0.078655645
92,0.078740098
93,0.07782495
94,0.078899898
95,0.078369193
96,0.077798128
97,0.078725778
98,0.077281013
99,0.078607157
100,0.076764211
101,0.07629551
102,0.077844582
103,0.076666161
104,0.078515522
105,0.078964576
106,0.077571474
107,0.076098993
108,0.079728745
109,0.080125272
110,0.080744788
111,0.078144841
112,0.079057984
113,0.078390449
114,0.077428356
115,0.078634188
116,0.078393236
117,0.077433363
118,0.078521557
119,0.077563889
120,0.079545222
121,0.078197427
122,0.07850489
123,0.080044329
124,0.076884575
125,0.081678033
126,0.081373721
127,0.082075879
128,0.080318056
129,0.081548244
130,0.078999005
131,0.08001674
132,0.081596717
133,0.083803773
134,0.081452332
135,0.081455216
136,0.082499102
137,0.080366448
138,0.082834184
139,0.081405699
140,0.084257819
141,0.083818503
142,0.083249316
143,0.083438039
144,0.082775608
145,0.083321862
146,0.084908232
147,0.083847187
148,0.085227922
149,0.083965302
150,0.085336208
151,0.08431159
152,0.08501631
153,0.084950134
154,0.084109135
155,0.091386363
156,0.088391662
157,0.085370205
158,0.085074365
159,0.084631309
160,0.086067237
161,0.086984426
162,0.085894965
163,0.086263724
164,0.085689545
165,0.085238986
166,0.085138455
167,0.089329422
168,0.087386414
169,0.089109227
170,0.086756788
171,0.086868308
172,0.086912282
173,0.089999892
174,0.088779368
175,0.089649782
176,0.090526268
177,0.091065153
178,0.090304211
179,0.091265976
180,0.091230981
181,0.091332957
182,0.095137171
183,0.096735775
184,0.093734503
185,0.095121749
186,0.094863139
187,0.098425888
188,0.094493851
189,0.099127002
190,0.095808171
191,0.097759329
192,0.100866824
193,0.097521015
194,0.099289238
195,0.098601975
196,0.09990824
197,0.098284096
198,0.0980938
199,0.09879116
200,0.099389285
201,0.100002781
202,0.099934496
203,0.099531136
204,0.101993367
205,0.098127976
206,0.102029726
207,0.098477051
208,0.102600239
209,0.100209109
210,0.099977754
211,0.098494895
212,0.101321504
213,0.099758953
214,0.100216582
215,0.103032626
216,0.1021614
217,0.104931593
218,0.106118783