Running Env Steps,Itration,Running Reverse KL,Real Sto Return,Loss,Real Det Return,Running Forward KL,Running Update Time
0,0,6.9935,-1487.64,-116.49739837646484,-796.3,39.2943,0
5000,1,6.1895,-1431.02,176.10255432128906,-548.39,38.7815,1
10000,2,8.4068,-1082.61,-11.91598129272461,-342.45,39.8844,2
15000,3,6.0236,-589.73,24.309337615966797,-315.65,38.549,3
20000,4,7.0799,-555.72,-26.769840240478516,-931.82,38.6884,4
25000,5,8.0685,-738.54,487.8677673339844,-1315.92,39.0198,5
30000,6,8.0807,-906.05,-22.16559600830078,-1650.56,39.5647,6
35000,7,8.8629,-1078.61,79.48371887207031,-1582.82,41.0195,7
40000,8,8.9435,-1186.96,5.646303176879883,-2006.62,40.5684,8
45000,9,8.7703,-1477.42,-244.7947540283203,-2268.25,41.6539,9
50000,10,8.7778,-1242.08,-68.78327941894531,-2111.57,39.098,10
55000,11,9.1582,-1500.34,-9.641796112060547,-2533.45,40.2489,11
60000,12,9.8003,-1602.29,81.58033752441406,-2581.94,41.2138,12
65000,13,9.9116,-1609.57,9.013861656188965,-2403.72,40.8287,13
70000,14,9.002,-1821.98,812.4005126953125,-3108.84,40.4144,14
75000,15,10.4691,-1952.7,-5.109667778015137,-2835.76,41.2581,15
80000,16,10.9186,-2167.45,4.597663879394531,-3030.81,41.1491,16
85000,17,10.565,-2352.19,-64.56765747070312,-3514.97,41.2232,17
90000,18,10.1677,-2151.99,442.1686706542969,-3711.57,41.2998,18
95000,19,11.6126,-2522.41,113.97164916992188,-3315.87,41.3202,19
100000,20,10.7032,-2558.69,47.4374885559082,-3354.43,40.926,20
105000,21,11.3991,-2547.59,11.77215576171875,-3692.33,42.0244,21
110000,22,11.1347,-2507.52,25.09540367126465,-3491.68,40.9574,22
115000,23,11.2664,-2536.65,19.53238296508789,-3467.0,41.5059,23
120000,24,11.5985,-2806.99,96.68749237060547,-3759.05,42.2072,24
125000,25,10.7899,-2658.41,19.57106590270996,-3598.18,41.4587,25
130000,26,11.0556,-2785.43,-10.157644271850586,-3801.49,41.708,26
135000,27,12.1572,-2702.57,-17.843664169311523,-3773.42,42.7262,27
140000,28,10.2211,-2616.76,-49.667091369628906,-3307.42,41.0539,28
145000,29,11.6104,-2887.44,34.75612258911133,-3537.06,42.3571,29
150000,30,10.8732,-2718.86,9.434043884277344,-3498.89,41.5055,30
155000,31,11.29,-2863.18,-44.40271759033203,-3648.51,41.7066,31
160000,32,12.1421,-2984.65,29.311477661132812,-3636.06,42.1664,32
165000,33,11.1315,-2792.17,-17.042278289794922,-3593.94,40.9091,33
170000,34,11.518,-3065.49,41.99147033691406,-3946.25,42.1637,34
175000,35,10.9792,-2696.5,70.88240814208984,-4231.3,41.2536,35
180000,36,10.9106,-2447.03,11.548370361328125,-3003.59,41.1368,36
185000,37,10.7117,-2971.89,28.621315002441406,-3676.63,42.0515,37
190000,38,11.675,-3151.76,47.81401062011719,-3968.46,42.3478,38
195000,39,11.3593,-3121.5,70.91670989990234,-3754.19,42.1435,39
200000,40,11.3665,-3088.96,29.943645477294922,-4002.19,41.9721,40
205000,41,11.1079,-3011.36,-15.61892032623291,-4034.79,41.1537,41
210000,42,11.0774,-3052.31,0.16492605209350586,-3851.91,41.646,42
215000,43,11.0246,-2864.43,15.793621063232422,-3476.99,41.2478,43
220000,44,10.9333,-2982.72,51.3538703918457,-3989.16,41.5195,44
225000,45,10.7492,-2858.83,-21.5609073638916,-4139.46,41.6857,45
230000,46,11.0757,-2951.28,-25.6960391998291,-3692.4,41.6024,46
235000,47,11.0904,-3083.84,11.519074440002441,-4137.91,42.2173,47
