_step,actor/entropy,avg_score/16384/four_sets,critic/acc/mean,response_length/mean
1,1.048940896987915,,0.0966796875,1292.8779296875
2,1.037702202796936,,0.0927734375,1261.416015625
3,0.9349271655082703,,0.1162109375,1291.89453125
4,1.0309401750564575,,0.1103515625,1305.58984375
5,0.9456517100334167,,0.140625,1168.529296875
6,0.9341753721237183,,0.1259765625,1309.216796875
7,0.9142586588859558,,0.1181640625,1304.05078125
8,0.9223456978797913,,0.1298828125,1273.6484375
9,0.9879432320594788,,0.1220703125,1383.580078125
10,0.9258550405502319,0.33181793842034807,0.123046875,1562.4287109375
11,0.8722853660583496,,0.1298828125,1523.107421875
12,0.9441710710525513,,0.1259765625,1488.4267578125
13,0.7452278733253479,,0.150390625,1634.033203125
14,1.0094748735427856,,0.1640625,1639.9072265625
15,0.8742159605026245,,0.16015625,1738.6845703125
16,0.7969779372215271,,0.16796875,1802.1875
17,0.9493458867073059,,0.1591796875,1906.1806640625
18,0.7676389217376709,,0.1591796875,2005.076171875
19,0.7951299548149109,,0.1875,2012.05859375
20,0.8728427886962891,0.33947233377956265,0.1767578125,2167.2548828125
21,0.7268337607383728,,0.1884765625,1937.158203125
22,0.787345290184021,,0.1650390625,2104.0498046875
23,0.7519121766090393,,0.15625,2044.48828125
24,0.6841181516647339,,0.1494140625,2062.4638671875
25,0.7313006520271301,,0.1982421875,2060.1376953125
26,0.6507143974304199,,0.193359375,2189.75
27,0.6575917601585388,,0.189453125,2063.5625
28,0.6644745469093323,,0.189453125,2180.8349609375
29,0.5856471061706543,,0.173828125,2314.306640625
30,0.7126524448394775,0.3640394912985274,0.2275390625,2163.189453125
31,0.6177217364311218,,0.1826171875,2042.8994140625
32,0.6340759992599487,,0.2236328125,2307.208984375
33,0.5798024535179138,,0.162109375,2277.041015625
34,0.6479659676551819,,0.1845703125,2462.9404296875
35,0.5944085121154785,,0.1875,2226.80078125
36,0.5943964719772339,,0.21484375,2206.2998046875
37,0.5325513482093811,,0.1943359375,2116.4267578125
38,0.5837413668632507,,0.234375,2150.4658203125
39,0.47490066289901733,,0.234375,2307.6904296875
40,0.5786012411117554,0.37970894689870593,0.21875,2292.115234375
41,0.5362961292266846,,0.216796875,2323.3583984375
42,0.4801284372806549,,0.1962890625,2394.9765625
43,0.6590713262557983,,0.19921875,2466.3994140625
44,0.5676201581954956,,0.2490234375,2415.3212890625
45,0.6070054769515991,,0.203125,2408.611328125
46,0.6634806394577026,,0.2080078125,2579.7431640625
47,0.5910064578056335,,0.224609375,2647.0556640625
48,0.5499816536903381,,0.220703125,2699.7041015625
49,0.6348438858985901,,0.224609375,2677.7119140625
50,0.6149523854255676,0.40353977019187864,0.216796875,2695.583984375
51,0.5575366616249084,,0.2197265625,2578.767578125
52,0.5257735252380371,,0.2099609375,2386.16015625
53,0.44132617115974426,,0.19921875,2417.8232421875
54,0.4841168224811554,,0.2353515625,2365.7060546875
55,0.48085322976112366,,0.248046875,2291.2294921875
56,0.4996477961540222,,0.267578125,2196.59765625
57,0.4777590334415436,,0.259765625,2323.65234375
58,0.4651239812374115,,0.279296875,2209.7744140625
59,0.4704245626926422,,0.28125,2048.9150390625
60,0.397807240486145,0.4252483266398929,0.2568359375,2159.0029296875
61,0.40859466791152954,,0.2490234375,2310.8779296875
62,0.3970121741294861,,0.2275390625,2378.609375
63,0.43222323060035706,,0.2578125,2304.890625
64,0.37114188075065613,,0.259765625,2475.9404296875
65,0.43945467472076416,,0.2685546875,2359.875
66,0.45019036531448364,,0.2138671875,2393.865234375
67,0.39466938376426697,,0.2666015625,2405.208984375
68,0.3910785913467407,,0.279296875,2337.7685546875
69,0.34692949056625366,,0.2626953125,2406.8173828125
70,0.3464331328868866,0.44586618697010266,0.25390625,2485.3779296875
71,0.3920729160308838,,0.23828125,2569.6025390625
72,0.3028305172920227,,0.193359375,2519.7294921875
73,0.3726155757904053,,0.240234375,2612.73046875
74,0.4048455059528351,,0.2548828125,2691.181640625
75,0.30071404576301575,,0.2587890625,2506.3037109375
76,0.3273458480834961,,0.259765625,2554.8583984375
77,0.35298845171928406,,0.2978515625,2512.6572265625
78,0.311466783285141,,0.2685546875,2578.6240234375
79,0.3288600444793701,,0.265625,2502.49609375
80,0.3165881931781769,0.4297668451584114,0.2265625,2755.87890625
81,0.3287346065044403,,0.2744140625,2469.6318359375
82,0.26738011837005615,,0.2958984375,2371.7509765625
83,0.25766727328300476,,0.26953125,2571.7724609375
84,0.24330472946166992,,0.2890625,2390.94921875
85,0.3014355003833771,,0.2587890625,2562.896484375
86,0.2804647982120514,,0.3134765625,2385.2705078125
87,0.2770220935344696,,0.29296875,2839.287109375
88,0.2718498110771179,,0.283203125,2583.193359375
89,0.2575286626815796,,0.2880859375,2698.5908203125
90,0.2985458970069885,0.4563659638554217,0.3359375,2504.89453125
91,0.24097971618175507,,0.2646484375,2622.9384765625
92,0.24977700412273407,,0.29296875,2538.5400390625
93,0.25461652874946594,,0.2958984375,2629.0224609375
94,0.254587322473526,,0.2939453125,2623.3642578125
95,0.25101959705352783,,0.3125,2604.5625
96,0.23352183401584625,,0.2822265625,2671.5361328125
97,0.22246575355529785,,0.345703125,2815.552734375
98,0.22156135737895966,,0.2919921875,2520.9580078125
99,0.22105185687541962,,0.2998046875,2754.8525390625
100,0.21342308819293976,0.4598941878625614,0.3349609375,2740.373046875
101,0.2183859497308731,,0.3017578125,2796.98828125
102,0.2112235277891159,,0.3115234375,2764.83203125
103,0.24462196230888367,,0.3916015625,2661.6064453125
104,0.20249781012535095,,0.3359375,2746.0673828125
105,0.22926805913448334,,0.3447265625,2756.5703125
106,0.22008898854255676,,0.330078125,2831.6064453125
107,0.24627286195755005,,0.3330078125,2883.7431640625
108,0.17909736931324005,,0.310546875,3224.8740234375
109,0.2287282943725586,,0.333984375,2821.54296875
110,0.20833200216293335,0.46741387773315485,0.2451171875,3210.0615234375
111,0.2051052302122116,,0.333984375,2906.48046875
112,0.20102229714393616,,0.3544921875,2973.330078125
113,0.2128685712814331,,0.3486328125,3269.474609375
114,0.1714026778936386,,0.345703125,3060.11328125
115,0.19857624173164368,,0.3173828125,3121.6884765625
116,0.21089130640029907,,0.33203125,3022.6962890625
117,0.19522985816001892,,0.3408203125,3101.3623046875
118,0.17585115134716034,,0.322265625,3102.2451171875
119,0.19314710795879364,,0.341796875,2990.9912109375
120,0.16964735090732574,0.47424375278893355,0.30859375,2953.0107421875
121,0.22270135581493378,,0.333984375,2989.6103515625
122,0.16841483116149902,,0.33203125,2985.890625
123,0.15874511003494263,,0.3203125,3283.0263671875
124,0.15642546117305756,,0.2958984375,2949.9404296875
125,0.15062347054481506,,0.3203125,2978.3798828125
126,0.15504975616931915,,0.3408203125,3075.0654296875
127,0.1588089019060135,,0.3466796875,3022.3603515625
128,0.15838854014873505,,0.310546875,3058.1484375
129,0.1527603566646576,,0.3173828125,2985.56640625
130,0.149629607796669,0.4790465194109772,0.349609375,3381.9345703125
131,0.14152801036834717,,0.3359375,3254.3330078125
132,0.14329388737678528,,0.3642578125,3222.7685546875
133,0.13577419519424438,,0.341796875,3146.1044921875
134,0.1411183625459671,,0.443359375,3209.0390625
135,0.1408335268497467,,0.3681640625,3434.546875
136,0.15587225556373596,,0.3310546875,3612.14453125
137,0.14040762186050415,,0.3984375,3436.376953125
138,0.13812780380249023,,0.38671875,3511.572265625
139,0.1554163098335266,,0.322265625,3736.98046875
140,0.136626735329628,0.490037260151718,0.3369140625,3801.623046875
141,0.12336304038763046,,0.3916015625,3749.892578125
142,0.13970325887203217,,0.3603515625,3577.8017578125
143,0.13438916206359863,,0.3955078125,3620.8330078125
144,0.1329752504825592,,0.357421875,3772.125
145,0.1257733702659607,,0.4072265625,3538.21484375
146,0.11247428506612778,,0.4072265625,3797.953125
147,0.133270725607872,,0.4287109375,3572.3017578125
148,0.13337929546833038,,0.37109375,3752.9990234375
149,0.13946786522865295,,0.3740234375,3788.4521484375
150,0.12771646678447723,0.49094701026327536,0.4013671875,3729.865234375
151,0.13723236322402954,,0.345703125,4052.7841796875
152,0.13817988336086273,,0.36328125,3814.212890625
153,0.1352337896823883,,0.392578125,3480.5595703125
154,0.11770575493574142,,0.392578125,3676.712890625
155,0.12900206446647644,,0.3515625,3832.8876953125
156,0.12467876076698303,,0.34765625,3906.9501953125
157,0.12841923534870148,,0.37109375,3834.0283203125
158,0.12807753682136536,,0.298828125,3876.3046875
159,0.1273195594549179,,0.4169921875,3848.0068359375
160,0.13318562507629395,0.5005701695671575,0.3544921875,3945.0146484375
161,0.13370265066623688,,0.3427734375,4295.576171875
162,0.13724654912948608,,0.3916015625,4026.9150390625
163,0.12540827691555023,,0.4443359375,3904.6904296875
164,0.1359451562166214,,0.4248046875,3651.205078125
165,0.12700708210468292,,0.4541015625,3726.650390625
166,0.1232239380478859,,0.35546875,4034.94921875
167,0.1273251175880432,,0.3896484375,4230.8779296875
168,0.1300511509180069,,0.4091796875,3917.78125
169,0.1280907243490219,,0.4521484375,3930.8466796875
170,0.12772123515605927,0.5117921686746988,0.3896484375,4433.890625
171,0.1258910447359085,,0.421875,4102.23828125
172,0.12722747027873993,,0.423828125,4030.21875
173,0.13855820894241333,,0.48046875,4031.9267578125
174,0.12047343701124191,,0.3662109375,4555.20703125
175,0.13402360677719116,,0.388671875,4339.5615234375
176,0.13282303512096405,,0.4150390625,4028.7138671875
177,0.12522082030773163,,0.3828125,4630.833984375
178,0.13798028230667114,,0.439453125,4195.763671875
179,0.11983855813741684,,0.3779296875,4462.2578125
180,0.12374776601791382,0.5062942324854975,0.4072265625,4344.1416015625
181,0.11755809932947159,,0.3798828125,4560.4345703125
182,0.12374727427959442,,0.4326171875,4313.5419921875
183,0.12711884081363678,,0.3984375,4423.779296875
184,0.1235228180885315,,0.404296875,4625.4609375
185,0.12648704648017883,,0.3857421875,4349.05859375
186,0.11229857802391052,,0.4140625,4360.064453125
187,0.12926466763019562,,0.40234375,4230.8251953125
188,0.12223411351442337,,0.431640625,4137.703125
189,0.12799566984176636,,0.3916015625,4583.8046875
190,0.1243695318698883,0.5360829428826417,0.451171875,4319.6474609375
191,0.12469780445098877,,0.4267578125,4621.2939453125
192,0.1418135017156601,,0.3974609375,4335.4921875
193,0.13830429315567017,,0.3837890625,4502.2783203125
194,0.1482691615819931,,0.4326171875,4299.693359375
195,0.12690600752830505,,0.45703125,4040.62890625
196,0.12360978871583939,,0.4423828125,4538.7998046875
197,0.13220681250095367,,0.4580078125,4233.310546875
198,0.12728995084762573,,0.4580078125,4474.384765625
199,0.12837877869606018,,0.4501953125,4478.015625
200,0.12894634902477264,0.5138817492190986,0.4658203125,4522.427734375
201,0.12696070969104767,,0.4140625,4451.353515625
202,0.12209251523017883,,0.4736328125,4401.078125
203,0.13168495893478394,,0.4248046875,4525.6015625
204,0.12984244525432587,,0.515625,4307.783203125
205,0.12350206822156906,,0.3984375,4688.501953125
206,0.12696364521980286,,0.419921875,4730.9560546875
207,0.14846087992191315,,0.3798828125,4774.5380859375
208,0.1386384516954422,,0.419921875,4508.193359375
209,0.15106523036956787,,0.4443359375,4429.9375
210,0.13919925689697266,0.5387264614011602,0.3994140625,4891.6630859375
211,0.1466885209083557,,0.419921875,4416.34375
212,0.14860166609287262,,0.3935546875,4829.0703125
213,0.1226336732506752,,0.490234375,4468.392578125
214,0.1363704651594162,,0.4580078125,4470.6142578125
215,0.14007574319839478,,0.44921875,4735.513671875
216,0.1323121041059494,,0.478515625,4508.9013671875
217,0.13657639920711517,,0.458984375,4648.552734375
218,0.12611551582813263,,0.419921875,4839.9775390625
219,0.13572368025779724,,0.349609375,5139.87109375
220,0.12437764555215836,0.5359500780901383,0.4560546875,4726.2763671875
221,0.1358201801776886,,0.4375,4714.603515625
222,0.12872885167598724,,0.5439453125,4382.3251953125
223,0.12822912633419037,,0.44921875,4717.5615234375
224,0.12821190059185028,,0.4326171875,4912.509765625
225,0.1382870227098465,,0.4111328125,4770.57421875
226,0.13642770051956177,,0.375,5190.8720703125
227,0.12463057041168213,,0.4296875,4839.4697265625
228,0.12895339727401733,,0.466796875,4941.2880859375
229,0.13724921643733978,,0.4306640625,4659.08203125
230,0.13480117917060852,0.5435100401606425,0.4287109375,5101.0380859375
231,0.1338130384683609,,0.421875,4789.1123046875
232,0.13730712234973907,,0.4814453125,4627.63671875
233,0.12891912460327148,,0.4970703125,4481.640625
234,0.13454222679138184,,0.5,4693.8779296875
235,0.13811609148979187,,0.42578125,4952.9365234375
236,0.13523709774017334,,0.515625,4637.94921875
237,0.15049517154693604,,0.4287109375,4993.921875
238,0.14613783359527588,,0.4453125,4850.263671875
239,0.13883990049362183,,0.44921875,5013.857421875
240,0.13632450997829437,0.5494873382418564,0.4765625,4932.5029296875
241,0.1429639458656311,,0.43359375,4873.9443359375
242,0.15056177973747253,,0.4345703125,4939.2099609375
243,0.13510800898075104,,0.47265625,4857.560546875
244,0.14204755425453186,,0.4462890625,4723.1484375
245,0.1361970603466034,,0.458984375,4830.333984375
246,0.14883895218372345,,0.453125,4807.7412109375
247,0.1463196575641632,,0.4677734375,4687.9453125
248,0.142476424574852,,0.4638671875,4624.3837890625
249,0.1357283741235733,,0.529296875,4541.0888671875
250,0.13664467632770538,0.5415614123159304,0.49609375,4518.3232421875
251,0.15015855431556702,,0.4716796875,4526.9375
252,0.1359556019306183,,0.484375,4718.48828125
253,0.14566704630851746,,0.4443359375,4799.8505859375
254,0.14033295214176178,,0.4609375,4835.3125
255,0.14330902695655823,,0.4501953125,4872.6591796875
256,0.14198008179664612,,0.498046875,4732.7880859375
257,0.1226305216550827,,0.48828125,4659.89453125
258,0.14892829954624176,,0.396484375,4917.328125
259,0.14338046312332153,,0.4501953125,4872.328125
260,0.1494635045528412,0.5475811021865238,0.4423828125,5150.67578125
261,0.16140641272068024,,0.408203125,5189.2314453125
262,0.136082261800766,,0.4736328125,4905.93359375
263,0.13797155022621155,,0.421875,5010.7783203125
264,0.14875231683254242,,0.5205078125,4572.486328125
265,0.1441052258014679,,0.513671875,4855.6796875
266,0.1433451771736145,,0.5546875,4608.1787109375
267,0.14218205213546753,,0.505859375,4762.5185546875
268,0.14231757819652557,,0.533203125,4784.3857421875
269,0.13984353840351105,,0.5009765625,4559.0126953125
270,0.13505342602729797,0.5744161088799643,0.53125,4874.8486328125
271,0.13976715505123138,,0.5087890625,4936.0546875
272,0.16018424928188324,,0.484375,5124.7919921875
273,0.15172971785068512,,0.486328125,5106.7412109375
274,0.1474377065896988,,0.5341796875,5128.1279296875
275,0.15961508452892303,,0.4951171875,5123.4873046875
276,0.15219570696353912,,0.4599609375,5133.8681640625
277,0.15252618491649628,,0.4326171875,5421.2744140625
278,0.15662842988967896,,0.5400390625,4749.4931640625
279,0.15442219376564026,,0.4765625,5018.4462890625
280,0.14206759631633759,0.5710295069165551,0.48046875,5188.8173828125
281,0.15737228095531464,,0.4609375,5203.0634765625
282,0.15809066593647003,,0.4912109375,5019.07421875
283,0.17081710696220398,,0.4912109375,4964.140625
284,0.14476513862609863,,0.541015625,5145.572265625
285,0.15517158806324005,,0.5458984375,5135.72265625
286,0.16007648408412933,,0.4482421875,5422.486328125
287,0.15723058581352234,,0.4443359375,5182.61328125
288,0.15601420402526855,,0.53125,5113.162109375
289,0.15456905961036682,,0.4375,5222.6025390625
290,0.14577414095401764,0.5833049977688531,0.5048828125,5230.544921875
291,0.1433631181716919,,0.51953125,5300.873046875
292,0.16145412623882294,,0.4560546875,5092.2958984375
293,0.15342378616333008,,0.517578125,5035.3984375
294,0.15264837443828583,,0.4990234375,5162.0439453125
295,0.1732293665409088,,0.4638671875,5085.142578125
296,0.16045266389846802,,0.4853515625,5056.8525390625
297,0.16346266865730286,,0.486328125,4977.3359375
298,0.15864920616149902,,0.4833984375,5147.3720703125
