Itration,Running Forward KL,Running Reverse KL,Real Det Return,Running Update Time,Reward Loss,Real Sto Return,Running Env Steps
0,153.3443,2580.8371,886.88,0,35553.79296875,-193.69,0
1,150.2433,2558.3291,709.85,1,188149.375,-129.03,5000
2,146.0277,1569.4328,800.7,2,184316.671875,-118.61,10000
3,145.2146,1707.4093,737.94,3,-114384.8984375,-132.99,15000
4,144.7026,1961.9831,704.11,4,-240584.578125,-91.81,20000
5,143.0009,1792.5846,618.61,5,-193853.953125,-158.2,25000
6,144.6066,1032.0339,816.54,6,-234545.984375,-107.76,30000
7,144.4794,1764.838,675.0,7,-281930.5625,-212.36,35000
8,145.5033,1037.3204,706.69,8,-658017.75,-173.3,40000
9,148.0166,1755.0269,632.61,9,-507495.53125,-155.64,45000
10,146.5801,2133.8985,645.84,10,-654622.8125,-148.95,50000
11,144.5947,1149.0775,586.96,11,-696156.5,-161.52,55000
12,145.5299,1617.7107,763.75,12,-607049.5625,-172.49,60000
13,145.7339,1684.711,649.52,13,-759752.3125,-173.1,65000
14,143.1232,1261.6338,720.01,14,-685802.0,-214.44,70000
15,139.7485,989.605,781.69,15,-923527.0625,-185.07,75000
16,138.8981,942.4862,713.81,16,-1014933.875,-153.47,80000
17,144.7906,1401.649,729.96,17,-921674.875,-157.2,85000
18,138.9205,1090.811,595.16,18,-1007535.8125,-165.26,90000
19,143.1491,792.4944,715.67,19,-1151538.125,-161.74,95000
20,143.1076,1631.3939,785.49,20,-1378459.125,-160.79,100000
21,142.2286,461.9472,691.29,21,-1335930.5,-163.35,105000
22,142.0849,1043.8706,708.2,22,-1641353.75,-182.1,110000
23,136.5213,544.5347,744.28,23,-1621620.625,-171.75,115000
24,142.459,1355.0853,692.1,24,-1478351.25,-228.57,120000
25,139.4429,1328.5921,707.47,25,-1687897.25,-251.67,125000
26,140.9822,1091.8037,751.23,26,-1896870.5,-190.42,130000
27,141.3741,1015.1862,775.55,27,-1965236.75,-195.48,135000
28,140.2007,842.9661,680.66,28,-1913304.125,-221.28,140000
29,142.085,907.5354,742.13,29,-1965281.75,-239.98,145000
30,140.4671,1086.0195,799.94,30,-2064484.375,-205.5,150000
31,139.7732,742.357,819.12,31,-2372470.0,-195.81,155000
32,142.7062,1378.6245,679.26,32,-2304961.0,-231.14,160000
33,139.0344,881.7807,706.82,33,-2241604.0,-182.03,165000
34,141.8417,1697.9705,829.28,34,-2539392.0,-190.9,170000
35,141.7456,633.8774,764.35,35,-2549291.75,-239.73,175000
36,140.4651,1172.9748,786.48,36,-2749076.5,-186.55,180000
37,141.8065,593.9979,791.44,37,-2603066.5,-252.53,185000
38,139.8266,845.3242,758.19,38,-2572911.75,-203.76,190000
39,143.159,610.3534,705.38,39,-3062633.5,-175.14,195000
40,136.6225,715.489,719.14,40,-2783706.5,-241.84,200000
41,139.8949,795.3851,752.87,41,-2856202.5,-183.93,205000
42,136.7748,402.2792,773.69,42,-3044873.5,-245.54,210000
43,139.7061,795.5657,762.95,43,-2917539.75,-250.97,215000
44,136.832,523.3114,755.93,44,-3220933.75,-217.2,220000
45,139.1111,415.67,687.14,45,-3464728.5,-201.8,225000
46,141.6275,907.4859,800.5,46,-3409198.0,-183.74,230000
47,138.4059,948.1921,839.78,47,-3450424.5,-223.53,235000
48,140.1295,281.8494,848.78,48,-3566767.5,-277.82,240000
49,138.2279,229.5275,763.6,49,-3609166.75,-219.7,245000
50,140.8588,440.1902,703.33,50,-3709778.75,-205.99,250000
51,139.4348,611.1036,762.13,51,-3664974.25,-218.71,255000
52,139.5545,323.5778,746.8,52,-4038596.25,-181.71,260000
53,139.036,657.7815,778.94,53,-4173696.0,-212.75,265000
54,135.539,472.8641,788.62,54,-4137876.5,-245.34,270000
55,137.2191,507.4271,814.99,55,-4125467.0,-186.32,275000
56,137.4995,270.4839,814.02,56,-4247657.0,-242.26,280000
57,136.0165,325.34,737.6,57,-4248805.0,-229.26,285000
58,141.7477,509.4171,759.43,58,-4508683.5,-256.45,290000
59,138.7988,389.8394,651.66,59,-4527454.0,-288.03,295000
60,139.6838,166.3227,715.44,60,-4680172.0,-247.74,300000
61,141.4821,547.1451,733.22,61,-4776395.0,-231.71,305000
62,141.8545,561.6566,675.08,62,-5003671.0,-259.75,310000
63,138.2452,408.4497,789.19,63,-4950495.0,-255.2,315000
64,138.6556,928.6335,639.3,64,-4910260.5,-249.32,320000
65,134.5477,298.8346,830.44,65,-4887440.5,-234.95,325000
66,138.0533,345.3386,782.77,66,-5146417.0,-212.98,330000
67,135.407,641.8729,828.85,67,-5183848.0,-199.98,335000
68,139.3405,702.0458,677.85,68,-5455398.0,-283.02,340000
69,140.9534,510.4282,763.09,69,-5369386.0,-247.37,345000
70,137.3816,219.4332,807.34,70,-5603723.5,-226.83,350000
71,137.8818,547.5937,712.71,71,-5826581.5,-232.67,355000
72,139.7139,568.989,684.12,72,-5739251.5,-219.05,360000
73,140.8779,148.9603,619.78,73,-5983816.5,-210.84,365000
74,139.9974,1052.3559,789.2,74,-5765842.5,-237.27,370000
75,137.3692,537.4053,798.34,75,-6113316.5,-216.56,375000
76,139.3649,410.9284,769.95,76,-6102171.5,-251.13,380000
77,136.9296,46.3996,632.37,77,-6303865.0,-228.78,385000
78,138.4959,533.5719,759.62,78,-6402526.5,-184.86,390000
79,137.1159,74.0519,738.81,79,-6566401.0,-213.58,395000
80,140.9278,928.2992,741.18,80,-6715384.0,-223.92,400000
81,140.1993,123.6455,801.21,81,-6785062.0,-247.71,405000
