_step,actor/entropy,avg_score/16384/four_sets,critic/acc/mean,response_length/mean
1,1.048940896987915,,0.0966796875,1292.8779296875
2,1.037702202796936,,0.0927734375,1261.416015625
3,0.958188533782959,,0.1123046875,1318.6689453125
4,0.8118701577186584,,0.1064453125,1337.07421875
5,1.2164140939712524,,0.1103515625,1263.205078125
6,0.9515784978866577,,0.1376953125,1206.240234375
7,0.927644670009613,,0.095703125,1350.91796875
8,1.221787929534912,,0.1171875,1433.58203125
9,1.1177133321762085,,0.12109375,1399.6669921875
10,1.0333952903747559,0.30551210397144135,0.1298828125,1529.291015625
11,0.9422702193260193,,0.123046875,1531.71875
12,1.0039443969726562,,0.1259765625,1475.37890625
13,0.842411994934082,,0.1455078125,1599.806640625
14,0.914419412612915,,0.1689453125,1564.455078125
15,0.9186915159225464,,0.1357421875,1652.83203125
16,0.7773234248161316,,0.1640625,1796.833984375
17,0.8878266215324402,,0.142578125,1808.830078125
18,0.7553147673606873,,0.171875,1803.4326171875
19,0.6967107057571411,,0.181640625,1871.2587890625
20,0.7326955795288086,0.33607139669790276,0.1728515625,1869.9375
21,0.804415225982666,,0.1689453125,1889.2587890625
22,0.7675164937973022,,0.189453125,2049.8837890625
23,0.7771696448326111,,0.1767578125,2120.1826171875
24,0.6014740467071533,,0.138671875,2016.38671875
25,0.7877092361450195,,0.181640625,2099.693359375
26,0.8437134027481079,,0.1748046875,2202.7568359375
27,0.8444793224334717,,0.1845703125,2050.3837890625
28,0.64154452085495,,0.181640625,2011.18359375
29,0.6889636516571045,,0.177734375,2151.0615234375
30,0.7894794344902039,0.37616287371709056,0.2060546875,2026.662109375
31,0.5965559482574463,,0.1728515625,2119.2333984375
32,0.7561321258544922,,0.2294921875,2069.783203125
33,0.6414928436279297,,0.1474609375,2124.9931640625
34,0.6461452841758728,,0.18359375,2196.1787109375
35,0.7404161095619202,,0.1875,2226.7900390625
36,0.6688610911369324,,0.2041015625,2264.53125
37,0.5670307278633118,,0.1552734375,2243.5888671875
38,0.741607129573822,,0.201171875,2310.7392578125
39,0.6701458692550659,,0.2255859375,2483.9365234375
40,0.6681188344955444,0.38577309236947793,0.2099609375,2206.48828125
41,0.6483098864555359,,0.2119140625,2251.2841796875
42,0.5355284214019775,,0.19921875,2370.26953125
43,0.6680513620376587,,0.1875,2226.6064453125
44,0.7070887088775635,,0.224609375,2535.2490234375
45,0.6399738788604736,,0.1796875,2531.4716796875
46,0.724408745765686,,0.21484375,2615.0048828125
47,0.601334273815155,,0.2314453125,2416.025390625
48,0.5774431228637695,,0.2109375,2529.0234375
49,0.697655439376831,,0.23046875,2582.111328125
50,0.5553936958312988,0.42283327755466305,0.2060546875,2559.2412109375
51,0.5958781838417053,,0.224609375,2401.7744140625
52,0.546944797039032,,0.212890625,2392.55859375
53,0.4955240488052368,,0.1953125,2349.251953125
54,0.5722750425338745,,0.2060546875,2522.39453125
55,0.4831763505935669,,0.2373046875,2491.53515625
56,0.5030492544174194,,0.2890625,2209.197265625
57,0.5456334352493286,,0.236328125,2553.3642578125
58,0.5644177198410034,,0.28125,2379.3779296875
59,0.4053701162338257,,0.2578125,2353.078125
60,0.5463905334472656,0.4295937081659973,0.2578125,2407.6240234375
61,0.5270535349845886,,0.248046875,2720.939453125
62,0.5425812602043152,,0.2294921875,2521.8037109375
63,0.40611031651496887,,0.255859375,2404.26953125
64,0.4475526511669159,,0.2744140625,2547.328125
65,0.4762980043888092,,0.2724609375,2627.796875
66,0.3795531094074249,,0.22265625,2612.3798828125
67,0.3951592743396759,,0.27734375,2523.064453125
68,0.43384966254234314,,0.2783203125,2646.7490234375
69,0.451524555683136,,0.2373046875,2626.3330078125
70,0.538785994052887,0.4335446229361892,0.2255859375,2729.478515625
71,0.4253896176815033,,0.2373046875,2607.1240234375
72,0.41470593214035034,,0.189453125,2894.0361328125
73,0.5000185370445251,,0.2421875,2894.5244140625
74,0.5030209422111511,,0.2431640625,2992.9677734375
75,0.4938274919986725,,0.2578125,2955.5703125
76,0.510744571685791,,0.26171875,2881.3056640625
77,0.5058920979499817,,0.2587890625,2973.9404296875
78,0.5274516940116882,,0.2646484375,3167.7646484375
79,0.5416415333747864,,0.2568359375,2941.5185546875
80,0.4475818872451782,0.4370957719767961,0.232421875,2968.9912109375
81,0.48294728994369507,,0.2490234375,2982.23046875
82,0.4671449065208435,,0.2763671875,2715.8603515625
83,0.4530303180217743,,0.2744140625,2834.078125
84,0.46806541085243225,,0.271484375,2746.0126953125
85,0.5213765501976013,,0.2734375,2782.6611328125
86,0.5236703157424927,,0.3017578125,2742.9384765625
87,0.5046821236610413,,0.2822265625,3142.142578125
88,0.39443132281303406,,0.2802734375,2860.1015625
89,0.40307778120040894,,0.28515625,2934.9521484375
90,0.3956192135810852,0.43689139892904955,0.314453125,2770.658203125
91,0.3623059093952179,,0.296875,2773.9501953125
92,0.4784562587738037,,0.2919921875,2891.0283203125
93,0.4439318776130676,,0.2958984375,2783.49609375
94,0.405166357755661,,0.2939453125,2901.01953125
95,0.36226120591163635,,0.3056640625,2637.10546875
96,0.3395519554615021,,0.2431640625,2900.962890625
97,0.3746739625930786,,0.328125,3070.4150390625
98,0.3312295973300934,,0.283203125,2772.875
99,0.27675461769104004,,0.31640625,2789.416015625
100,0.31377261877059937,0.44781503792949573,0.333984375,2845.548828125
101,0.3154202997684479,,0.296875,2770.365234375
102,0.3549240529537201,,0.2783203125,2767.6455078125
103,0.29554587602615356,,0.404296875,2559.0830078125
104,0.3073597252368927,,0.3515625,2680.6494140625
105,0.3493289649486542,,0.33203125,2984.02734375
106,0.33643466234207153,,0.3310546875,3128.9833984375
107,0.2977725863456726,,0.3095703125,3038.1875
108,0.3316822350025177,,0.2919921875,3228.2802734375
109,0.370138943195343,,0.3359375,2964.408203125
110,0.3565221130847931,0.46895995091477016,0.2392578125,3112.5732421875
111,0.3183656930923462,,0.34375,2829.3310546875
112,0.2796025276184082,,0.3359375,2901.373046875
113,0.30156204104423523,,0.3212890625,3187.32421875
114,0.23273009061813354,,0.3525390625,3022.86328125
115,0.3644959032535553,,0.3193359375,3450.6416015625
116,0.32995912432670593,,0.314453125,3423.966796875
117,0.322103351354599,,0.32421875,3502.1474609375
118,0.3654092252254486,,0.3076171875,3573.4677734375
119,0.32828256487846375,,0.3271484375,3567.5576171875
120,0.29374444484710693,0.45957312583668003,0.318359375,3700.8828125
121,0.2844080626964569,,0.345703125,3556.4482421875
122,0.2441033124923706,,0.330078125,3498.2109375
123,0.2399771511554718,,0.3154296875,4018.130859375
124,0.26033350825309753,,0.3154296875,3750.7734375
125,0.2512822151184082,,0.3173828125,3615.724609375
126,0.2518809735774994,,0.3203125,3626.3974609375
127,0.2626775801181793,,0.3349609375,3683.1123046875
128,0.2524873912334442,,0.3046875,3778.30078125
129,0.27227532863616943,,0.3203125,3563.5908203125
130,0.23095335066318512,0.483,0.3486328125,3888.1845703125
131,0.2628720700740814,,0.3466796875,3714.62890625
132,0.27187326550483704,,0.3447265625,3722.9638671875
133,0.22710509598255157,,0.328125,3747.3271484375
134,0.2540423274040222,,0.431640625,3767.78125
135,0.2690262496471405,,0.38671875,3902.51171875
136,0.27373820543289185,,0.3408203125,3839.3779296875
137,0.2339351773262024,,0.4111328125,3838.62109375
138,0.23882144689559937,,0.3974609375,3864.4296875
139,0.2520626485347748,,0.333984375,4136.3935546875
140,0.23277784883975983,0.49563888888888885,0.3251953125,4360.513671875
141,0.21886533498764038,,0.404296875,4230.7890625
142,0.20897917449474335,,0.3857421875,4006.5
143,0.2464999556541443,,0.39453125,3971.552734375
144,0.2285100668668747,,0.384765625,4247.9052734375
145,0.2530154883861542,,0.419921875,3959.94140625
146,0.20332995057106018,,0.412109375,4260.3154296875
147,0.21602554619312286,,0.4794921875,4089.5732421875
148,0.20294035971164703,,0.3896484375,4535.806640625
149,0.214430034160614,,0.39453125,4337.2841796875
150,0.19675594568252563,0.5298984270414993,0.427734375,4350.048828125
151,0.1978849172592163,,0.349609375,4792.2197265625
152,0.20166711509227753,,0.3994140625,4386.5712890625
153,0.18828697502613068,,0.4013671875,4306.6591796875
154,0.20137803256511688,,0.4150390625,4166.888671875
155,0.20072215795516968,,0.369140625,4397.765625
156,0.17723453044891357,,0.390625,4513.3330078125
157,0.2045496553182602,,0.3671875,4580.1455078125
158,0.21017754077911377,,0.3203125,4858.7197265625
159,0.1778281182050705,,0.431640625,4640.1630859375
160,0.21213483810424805,0.5406873047746542,0.400390625,4718.01953125
161,0.208065465092659,,0.3583984375,4821.8955078125
162,0.21587274968624115,,0.40625,4680.4560546875
163,0.18320848047733307,,0.421875,4579.9716796875
164,0.20684774219989777,,0.43359375,4393.47265625
165,0.18497507274150848,,0.447265625,4433.9873046875
166,0.16799978911876678,,0.392578125,4704.7705078125
167,0.1594163030385971,,0.40234375,4726.4384765625
168,0.18246285617351532,,0.40234375,4527.298828125
169,0.1809898018836975,,0.4443359375,4502.8935546875
170,0.16959121823310852,0.5710924810352521,0.3955078125,4772.001953125
171,0.1802626997232437,,0.4384765625,4383.8583984375
172,0.17672374844551086,,0.4609375,4223.2373046875
173,0.19599631428718567,,0.4912109375,4140.96875
174,0.17733298242092133,,0.3955078125,4783.2744140625
175,0.19849739968776703,,0.404296875,4511.9990234375
176,0.1910647749900818,,0.4033203125,4301.8447265625
177,0.19644798338413239,,0.412109375,4802.1181640625
178,0.2172674685716629,,0.427734375,4334.513671875
179,0.1859249472618103,,0.4033203125,4626.4287109375
180,0.18193469941616058,0.5532568049977689,0.421875,4520.7763671875
181,0.15856128931045532,,0.3935546875,4797.490234375
182,0.16475100815296173,,0.4609375,4327.65234375
183,0.1755627542734146,,0.435546875,4570.9541015625
184,0.16689860820770264,,0.4140625,4645.5546875
185,0.15640072524547577,,0.4111328125,4500.9560546875
186,0.1542760133743286,,0.45703125,4357.0634765625
187,0.16437236964702606,,0.404296875,4287.505859375
188,0.16014553606510162,,0.4560546875,4031.9189453125
189,0.17039626836776733,,0.4150390625,4403.0341796875
190,0.1669730246067047,0.5655561133422579,0.4619140625,4183.26171875
191,0.16162094473838806,,0.4404296875,4393.001953125
192,0.16427086293697357,,0.42578125,4372.9384765625
193,0.16818341612815857,,0.404296875,4563.8056640625
194,0.1680627316236496,,0.4501953125,4242.666015625
195,0.15897198021411896,,0.458984375,4150.708984375
196,0.1469435691833496,,0.4716796875,4527.5791015625
197,0.15677577257156372,,0.4609375,4148.783203125
198,0.15764302015304565,,0.4521484375,4497.6513671875
199,0.14540286362171173,,0.5107421875,4366.03125
200,0.15061448514461517,0.5595410531012941,0.49609375,4225.09375
201,0.15546178817749023,,0.44921875,4211.734375
202,0.1563504934310913,,0.4580078125,4075.404296875
203,0.16863276064395905,,0.4306640625,4481.541015625
204,0.15268321335315704,,0.5341796875,4018.431640625
205,0.1409187763929367,,0.443359375,4387.0830078125
206,0.15183787047863007,,0.4052734375,4525.5283203125
207,0.14945301413536072,,0.3935546875,4562.1767578125
208,0.16508424282073975,,0.439453125,4233.5185546875
209,0.17592012882232666,,0.4697265625,3991.41796875
210,0.1564856320619583,0.5486575189647479,0.435546875,4455.34765625
211,0.1757000982761383,,0.4189453125,4149.0556640625
212,0.1641055792570114,,0.41015625,4495.3681640625
213,0.13729791343212128,,0.4921875,4188.2099609375
214,0.14024631679058075,,0.44921875,4215.7529296875
215,0.1571350395679474,,0.4296875,4462.1474609375
216,0.13928155601024628,,0.466796875,4204.4375
217,0.14988358318805695,,0.458984375,4433.4736328125
218,0.1412406712770462,,0.455078125,4486.990234375
219,0.15048415958881378,,0.4013671875,4890.5791015625
220,0.13837124407291412,0.5782473226238286,0.4521484375,4310.1845703125
221,0.1411222219467163,,0.466796875,4418.978515625
222,0.14701016247272491,,0.546875,4410.3134765625
223,0.14082302153110504,,0.4736328125,4477.677734375
224,0.13826300203800201,,0.458984375,4761.408203125
225,0.13991183042526245,,0.4541015625,4556.359375
226,0.1451120525598526,,0.3857421875,4857.3212890625
227,0.13123641908168793,,0.48046875,4504.0595703125
228,0.13184578716754913,,0.49609375,4486.3095703125
229,0.14366890490055084,,0.4521484375,4264.0556640625
230,0.14900603890419006,0.5764005466309683,0.4619140625,4632.4287109375
231,0.1405390352010727,,0.4501953125,4375.103515625
232,0.14506784081459045,,0.458984375,4267.05078125
233,0.135674849152565,,0.5146484375,4223.87109375
234,0.14289364218711853,,0.50390625,4407.0703125
235,0.1428067982196808,,0.466796875,4649.0009765625
236,0.14258641004562378,,0.5517578125,4119.7685546875
237,0.15774480998516083,,0.4609375,4520.708984375
238,0.14656391739845276,,0.48046875,4466.4765625
239,0.14210397005081177,,0.4697265625,4621.8896484375
240,0.14308620989322662,0.5632433623382419,0.4833984375,4648.529296875
241,0.14362730085849762,,0.46875,4559.05859375
242,0.15098071098327637,,0.4306640625,4512.349609375
243,0.13477559387683868,,0.486328125,4418.1865234375
244,0.14813949167728424,,0.4736328125,4340.6259765625
245,0.1390058547258377,,0.4921875,4408.740234375
246,0.15066389739513397,,0.4541015625,4381.259765625
247,0.15233050286769867,,0.447265625,4238.0712890625
248,0.15006856620311737,,0.4755859375,4193.6728515625
249,0.1468016803264618,,0.53125,4263.8154296875
250,0.1414499282836914,0.5668616688978135,0.509765625,4127.13671875
251,0.15145538747310638,,0.525390625,4199.5048828125
252,0.13260242342948914,,0.4912109375,4419.2880859375
253,0.14646615087985992,,0.4765625,4481.51171875
254,0.1424201875925064,,0.4853515625,4450.5810546875
255,0.15429401397705078,,0.4560546875,4443.6474609375
256,0.1465451717376709,,0.482421875,4198.74609375
257,0.1273096650838852,,0.544921875,4227.693359375
258,0.15182948112487793,,0.447265625,4339.79296875
259,0.15000683069229126,,0.486328125,4236.666015625
260,0.15275894105434418,0.5741130633645695,0.451171875,4532.3642578125
261,0.1598961502313614,,0.4375,4642.423828125
262,0.14686539769172668,,0.4853515625,4391.724609375
263,0.1452905833721161,,0.4111328125,4479.970703125
264,0.1566038429737091,,0.501953125,4106.591796875
265,0.14889094233512878,,0.4921875,4333.2158203125
266,0.14308343827724457,,0.5693359375,4058.314453125
267,0.143973246216774,,0.501953125,4253.861328125
268,0.14800313115119934,,0.529296875,4139.1728515625
269,0.14984692633152008,,0.5556640625,4036.775390625
270,0.1525711566209793,0.5857232820169567,0.544921875,4282.5634765625
271,0.1453663408756256,,0.5546875,4198.28515625
272,0.16254077851772308,,0.4453125,4565.7685546875
273,0.15173648297786713,,0.4873046875,4504.677734375
274,0.15041927993297577,,0.51953125,4641.6337890625
275,0.16454799473285675,,0.4638671875,4686.8505859375
276,0.15705735981464386,,0.451171875,4723.6416015625
277,0.15660907328128815,,0.4326171875,5008.2626953125
278,0.1503327637910843,,0.587890625,4202.76953125
279,0.1507638692855835,,0.4990234375,4521.984375
280,0.14448951184749603,0.5800892458723784,0.5126953125,4677.484375
281,0.15446904301643372,,0.455078125,4764.853515625
282,0.15193039178848267,,0.505859375,4342.515625
283,0.16575752198696136,,0.53125,4317.3603515625
284,0.13956138491630554,,0.5390625,4402.6640625
285,0.14757557213306427,,0.552734375,4557.8251953125
286,0.15466147661209106,,0.4501953125,4816.8623046875
287,0.1566060185432434,,0.458984375,4720.2275390625
288,0.151140034198761,,0.51953125,4564.6845703125
289,0.15449899435043335,,0.4853515625,4588.8583984375
290,0.13794387876987457,0.5850913096831771,0.552734375,4571.5615234375
291,0.1389903873205185,,0.50390625,4675.7666015625
292,0.1576436311006546,,0.478515625,4616.1240234375
293,0.14682678878307343,,0.52734375,4509.396484375
294,0.1452769786119461,,0.5263671875,4682.4716796875
295,0.1739925742149353,,0.4873046875,4632.0107421875
296,0.1483059972524643,,0.470703125,4600.7236328125
297,0.15429756045341492,,0.5234375,4676.349609375
298,0.1513432413339615,,0.4560546875,4764.3173828125
299,0.16569988429546356,,0.498046875,4589.357421875
300,0.14646358788013458,0.5802677376171352,0.53515625,4776.1767578125
