_step,avg_score/16384/four_sets,critic/score/mean,response_length/mean
1,,0.125,2881.4619140625
2,,0.09765625,2994.697265625
3,,0.095703125,2989.4345703125
4,,0.091796875,2976.658203125
5,,0.123046875,3049.3876953125
6,,0.1181640625,2986.607421875
7,,0.103515625,3119.66015625
8,,0.140625,2977.5224609375
9,,0.1064453125,2832.775390625
10,0.12030220883534137,0.1494140625,3065.470703125
11,,0.134765625,3003.19921875
12,,0.1298828125,3289.6103515625
13,,0.140625,3589.67578125
14,,0.1435546875,4057.47265625
15,,0.1796875,4012.7978515625
16,,0.1708984375,4160.4521484375
17,,0.197265625,3985.861328125
18,,0.1767578125,4400.8642578125
19,,0.2509765625,3698.0419921875
20,0.19487354975457383,0.2421875,3894.37109375
21,,0.2451171875,4372.73828125
22,,0.283203125,3731.154296875
23,,0.25390625,4325.5458984375
24,,0.2744140625,4031.51953125
25,,0.2802734375,3862.380859375
26,,0.2470703125,3834.9765625
27,,0.28125,3728.86328125
28,,0.3173828125,3320.2724609375
29,,0.2744140625,3879.0029296875
30,0.2116693998215083,0.251953125,3954.720703125
31,,0.3515625,3564.1455078125
32,,0.302734375,3710.609375
33,,0.3115234375,3186.4794921875
34,,0.296875,3158.2822265625
35,,0.2646484375,2750.3330078125
36,,0.3017578125,2771.78125
37,,0.310546875,3488.064453125
38,,0.3857421875,3390.984375
39,,0.31640625,3945.7783203125
40,0.22940969433288708,0.375,3626.583984375
41,,0.3447265625,3685.203125
42,,0.267578125,3625.765625
43,,0.2822265625,3899.4169921875
44,,0.3359375,3258.494140625
45,,0.27734375,4029.3017578125
46,,0.38671875,3120.46484375
47,,0.37890625,2704.7431640625
48,,0.3486328125,1819.7919921875
49,,0.337890625,1982.599609375
50,0.21916108879964302,0.365234375,2370.701171875
51,,0.369140625,2501.9296875
52,,0.2822265625,2719.654296875
53,,0.4033203125,2398.0869140625
54,,0.3642578125,2011.8203125
55,,0.294921875,2494.1845703125
56,,0.3505859375,2187.0244140625
57,,0.30078125,2435.58203125
58,,0.3935546875,2663.267578125
59,,0.3994140625,2919.66015625
60,0.25081459170013387,0.4365234375,2641.017578125
61,,0.375,2946.568359375
62,,0.3896484375,2724.0712890625
63,,0.3408203125,1758.2001953125
64,,0.375,2070.3818359375
65,,0.2978515625,2503.201171875
66,,0.396484375,2504.763671875
67,,0.369140625,3012.6748046875
68,,0.3876953125,2595.74609375
69,,0.3642578125,2312.4755859375
70,0.26163286479250336,0.361328125,2801.716796875
71,,0.34375,2915.201171875
72,,0.353515625,2640.55859375
73,,0.423828125,2610.107421875
74,,0.40234375,3158.287109375
75,,0.345703125,2766.0439453125
76,,0.32421875,2481.2685546875
77,,0.322265625,2080.5576171875
78,,0.3525390625,2359.626953125
79,,0.328125,2054.59765625
80,0.26092776662204376,0.400390625,2304.48046875
81,,0.388671875,2690.025390625
82,,0.3740234375,2617.369140625
83,,0.390625,2756.8837890625
84,,0.3349609375,3522.20703125
85,,0.357421875,3017.171875
86,,0.361328125,2477.7109375
87,,0.423828125,2291.591796875
88,,0.3896484375,2386.6142578125
89,,0.35546875,1842.5849609375
90,0.26073655734047296,0.38671875,2199.1748046875
91,,0.349609375,2609.2666015625
92,,0.3291015625,2984.0556640625
93,,0.388671875,2397.0029296875
94,,0.3974609375,1967.3056640625
95,,0.4248046875,1982.1376953125
96,,0.4091796875,1678.337890625
97,,0.3779296875,1850.9326171875
98,,0.423828125,2077.0810546875
99,,0.5009765625,1816.5263671875
100,0.27244511378848724,0.3798828125,2583.607421875
101,,0.4580078125,2091.2783203125
102,,0.37890625,2295.6083984375
103,,0.38671875,2421.056640625
104,,0.3271484375,2825.3408203125
105,,0.3583984375,2027.1474609375
106,,0.380859375,1781.7529296875
107,,0.423828125,1373.0078125
108,,0.4072265625,1529.1455078125
109,,0.404296875,1254.89453125
110,0.2597761601963409,0.3671875,1522.6123046875
111,,0.4052734375,1624.7529296875
112,,0.3798828125,1905.1875
113,,0.33984375,2168.2431640625
114,,0.41796875,2332.345703125
115,,0.4580078125,2296.8955078125
116,,0.3818359375,1929.0517578125
117,,0.4404296875,2268.4248046875
118,,0.3935546875,2166.1640625
119,,0.375,2156.1064453125
120,0.2656646028558679,0.400390625,2349.5302734375
121,,0.466796875,2039.9052734375
122,,0.4375,1551.1318359375
123,,0.3916015625,1252.84375
124,,0.3837890625,1093.7822265625
125,,0.41796875,1098.6240234375
126,,0.3828125,812.716796875
127,,0.439453125,1052.55859375
128,,0.390625,636.0859375
129,,0.4052734375,575.6337890625
130,0.2119429941990183,0.41796875,623.5
131,,0.3701171875,573.4208984375
132,,0.4296875,696.4248046875
133,,0.4296875,1126.9794921875
134,,0.3134765625,949.3935546875
135,,0.50390625,1321.2958984375
136,,0.400390625,1908.2763671875
137,,0.349609375,1651.728515625
138,,0.341796875,1450.4501953125
139,,0.408203125,1771.869140625
140,0.25793423694779116,0.4716796875,1438.828125
141,,0.46484375,1480.8720703125
142,,0.431640625,1110.7900390625
143,,0.4697265625,1198.17578125
144,,0.3388671875,1927.4921875
145,,0.3603515625,2310.4912109375
146,,0.4443359375,2109.2314453125
147,,0.3955078125,2096.392578125
148,,0.4921875,2407.5087890625
149,,0.4013671875,2533.8349609375
150,0.283225011155734,0.3916015625,2622.2509765625
151,,0.427734375,2677.9033203125
152,,0.4658203125,3078.8779296875
153,,0.4130859375,2486.4599609375
154,,0.4501953125,2538.416015625
155,,0.51171875,2213.890625
156,,0.4560546875,2063.2880859375
157,,0.458984375,2608.865234375
158,,0.47265625,2502.732421875
159,,0.4453125,1828.86328125
160,0.28473823070058013,0.439453125,2204.5419921875
161,,0.404296875,2381.125
162,,0.45703125,1922.52734375
163,,0.5185546875,2280.6142578125
164,,0.443359375,2323.59375
165,,0.4541015625,2208.650390625
166,,0.4892578125,2332.2109375
167,,0.50390625,2274.0341796875
168,,0.3837890625,2353.0498046875
169,,0.4580078125,2277.2841796875
170,0.289825245426149,0.431640625,2356.2890625
171,,0.4296875,2362.125
172,,0.46484375,3050.822265625
173,,0.484375,2781.6748046875
174,,0.4287109375,3199.2490234375
175,,0.4140625,2262.65625
176,,0.494140625,2215.052734375
177,,0.4892578125,2117.77734375
178,,0.5068359375,1742.9111328125
179,,0.45703125,1704.19921875
180,0.26568540829986614,0.4423828125,843.609375
181,,0.4599609375,926.8447265625
182,,0.443359375,1164.689453125
183,,0.453125,1043.4228515625
184,,0.3935546875,968.892578125
185,,0.4248046875,1046.5751953125
186,,0.4228515625,1325.095703125
187,,0.494140625,1212.4619140625
188,,0.48828125,1329.7685546875
189,,0.478515625,1149.130859375
190,0.28166320838911196,0.455078125,1377.626953125
191,,0.4501953125,1227.44140625
192,,0.4462890625,1524.6904296875
193,,0.431640625,1066.1796875
194,,0.4306640625,1277.00390625
195,,0.40625,1150.048828125
196,,0.3916015625,1006.6591796875
197,,0.427734375,1352.435546875
198,,0.4130859375,1726.7333984375
199,,0.4794921875,894.0634765625
200,0.2849951472556894,0.3818359375,1027.9267578125
201,,0.4775390625,1729.572265625
202,,0.513671875,1442.86328125
203,,0.4609375,1846.5068359375
204,,0.486328125,1823.6494140625
205,,0.501953125,2009.3935546875
206,,0.4052734375,1823.4482421875
207,,0.4599609375,1583.21875
208,,0.447265625,1597.0087890625
209,,0.5126953125,1569.0732421875
210,0.29524609549308345,0.45703125,1795.5439453125
211,,0.4404296875,1884.1337890625
212,,0.46484375,1779.29296875
213,,0.505859375,1999.3525390625
214,,0.470703125,1944.51953125
215,,0.501953125,1512.0390625
216,,0.47265625,1594.5224609375
217,,0.4208984375,1712.5751953125
218,,0.4736328125,1619.0107421875
219,,0.376953125,2137.6787109375
220,0.27604027219991073,0.4619140625,1408.4287109375
221,,0.478515625,1244.107421875
222,,0.4609375,1593.87890625
223,,0.5400390625,1295.3544921875
224,,0.5244140625,1653.052734375
225,,0.505859375,1543.2529296875
226,,0.458984375,1564.720703125
227,,0.474609375,1263.3466796875
228,,0.447265625,1453.0087890625
229,,0.46484375,1214.39453125
230,0.27637338241856313,0.458984375,1285.7529296875
231,,0.462890625,1496.6845703125
232,,0.4404296875,1900.744140625
233,,0.466796875,1763.9345703125
234,,0.3818359375,1939.376953125
235,,0.3876953125,1904.970703125
236,,0.513671875,1583.0810546875
237,,0.4033203125,1746.6044921875
238,,0.5458984375,1617.41015625
239,,0.4375,1578.962890625
240,0.27775697233377955,0.4580078125,1087.529296875
241,,0.4912109375,926.314453125
242,,0.408203125,1114.587890625
243,,0.44921875,1371.45703125
244,,0.486328125,1665.2421875
245,,0.46875,1215.552734375
246,,0.4384765625,1544.6708984375
247,,0.537109375,1532.5830078125
248,,0.4228515625,1208.8828125
249,,0.5,1469.046875
250,0.26681922132976355,0.423828125,1437.8212890625
251,,0.4677734375,1451.5673828125
252,,0.47265625,1528.736328125
253,,0.509765625,1358.1650390625
254,,0.521484375,1293.1396484375
255,,0.423828125,1651.2109375
256,,0.42578125,1480.5859375
257,,0.482421875,1439.58984375
258,,0.47265625,1661.205078125
259,,0.5107421875,1382.798828125
260,0.2869449464524766,0.4580078125,2142.9033203125
261,,0.5068359375,1327.1826171875
262,,0.4814453125,1494.1416015625
263,,0.4228515625,1728.8408203125
264,,0.484375,1747.5185546875
265,,0.4716796875,1931.697265625
266,,0.494140625,1900.599609375
267,,0.484375,2039.1962890625
268,,0.505859375,1810.130859375
269,,0.4462890625,1835.9423828125
270,0.3003366242748773,0.4931640625,1739.08203125
271,,0.5244140625,1566.357421875
272,,0.5361328125,1323.3642578125
273,,0.484375,1422.0908203125
274,,0.4833984375,1184.3251953125
275,,0.458984375,1294.84765625
276,,0.3896484375,1167.5361328125
277,,0.447265625,1199.126953125
278,,0.5126953125,1268.7021484375
279,,0.537109375,1095.4453125
280,0.28097434181169123,0.462890625,1371.32421875
281,,0.4990234375,1040.83203125
282,,0.4248046875,1167.6005859375
283,,0.4716796875,1329.31640625
284,,0.5107421875,1202.8408203125
285,,0.5126953125,1390.759765625
286,,0.4287109375,1634.068359375
287,,0.53125,1425.8701171875
288,,0.474609375,1661.2509765625
289,,0.5302734375,1454.513671875
290,0.278437974118697,0.4482421875,1677.2294921875
291,,0.4892578125,1346.2099609375
292,,0.484375,1613.6484375
293,,0.474609375,1795.490234375
294,,0.5419921875,1364.5439453125
295,,0.494140625,1648.7978515625
296,,0.4140625,1877.9931640625
297,,0.509765625,1452.2900390625
298,,0.4794921875,1616.376953125
299,,0.513671875,1468.1728515625
300,0.3048752788933512,0.4560546875,1788.169921875
301,,0.419921875,1961.16796875
302,,0.4228515625,2283.525390625
303,,0.517578125,1819.701171875
304,,0.439453125,1642.251953125
305,,0.509765625,1940.87890625
306,,0.494140625,1646.556640625
307,,0.517578125,1673.33984375
308,,0.5439453125,1456.6181640625
309,,0.4638671875,1844.041015625
310,0.3112836345381526,0.482421875,1900.6416015625
311,,0.5263671875,1616.869140625
312,,0.478515625,1995.83203125
313,,0.49609375,1803.6142578125
314,,0.5380859375,1533.1669921875
315,,0.5244140625,1334.1689453125
316,,0.505859375,1319.412109375
317,,0.4345703125,1309.23828125
318,,0.537109375,1937.1689453125
319,,0.451171875,1975.474609375
320,0.2879109214636323,0.521484375,1238.9375
321,,0.49609375,1640.22265625
322,,0.4462890625,1653.4443359375
323,,0.46484375,2020.1552734375
324,,0.5322265625,1822.2880859375
325,,0.498046875,2153.4677734375
326,,0.4853515625,2218.4228515625
327,,0.490234375,1511.439453125
328,,0.4013671875,1275.662109375
329,,0.5830078125,864.4501953125
330,0.23566711289602854,0.4794921875,788.658203125
331,,0.4990234375,210.34765625
332,,0.3955078125,489.5390625
333,,0.42578125,617.732421875
334,,0.494140625,688.455078125
335,,0.48046875,501.3408203125
336,,0.5380859375,1178.0400390625
337,,0.431640625,1024.048828125
338,,0.490234375,1012.638671875
339,,0.48046875,1421.41796875
340,0.2738250223114681,0.4716796875,1386.1240234375
341,,0.4541015625,1216.3349609375
342,,0.4755859375,966.9521484375
343,,0.447265625,1207.3466796875
344,,0.482421875,892.34375
345,,0.4775390625,1298.322265625
346,,0.4345703125,1189.7158203125
347,,0.4287109375,899.166015625
348,,0.4765625,1221.7412109375
349,,0.451171875,1315.46875
350,0.2925894132083891,0.5341796875,1554.9794921875
351,,0.4521484375,1717.5029296875
352,,0.521484375,2045.8125
353,,0.580078125,1132.3876953125
354,,0.529296875,1716.134765625
355,,0.57421875,1481.521484375
356,,0.447265625,1135.3818359375
357,,0.41796875,1563.6064453125
358,,0.435546875,1480.4814453125
359,,0.44921875,1254.1318359375
360,0.27551321954484603,0.4443359375,1419.00390625
361,,0.5322265625,954.1455078125
362,,0.4931640625,1526.3115234375
363,,0.509765625,1790.1455078125
364,,0.4765625,1064.8134765625
365,,0.5205078125,1323.521484375
366,,0.482421875,1539.9443359375
367,,0.49609375,1535.2578125
368,,0.423828125,1213.865234375
369,,0.4912109375,1331.158203125
370,0.26958076751450244,0.4443359375,1772.236328125
371,,0.4853515625,1473.8984375
372,,0.4912109375,1704.3818359375
373,,0.4638671875,1442.3564453125
374,,0.533203125,1433.509765625
375,,0.48828125,1919.1669921875
376,,0.466796875,1894.611328125
377,,0.4931640625,1747.5693359375
378,,0.45703125,2175.4560546875
379,,0.478515625,1717.4287109375
380,0.2871164658634538,0.4814453125,1830.4404296875
381,,0.5458984375,1496.2802734375
382,,0.4482421875,2165.4619140625
383,,0.5029296875,2030.904296875
384,,0.4990234375,1592.2216796875
385,,0.494140625,1804.47265625
386,,0.447265625,2152.51953125
387,,0.4345703125,2010.16796875
388,,0.5009765625,1709.84765625
389,,0.4521484375,1722.29296875
