Running Update Time,Reward Loss,Running Reverse KL,Real Sto Return,Running Forward KL,Real Det Return,Real Sto violation,Running Env Steps,Real Det violation,Itration
0,706.5711669921875,10.8435,-142.08,17.6702,-1271.61,1.0,0,0.0,0
1,869.6453247070312,13.1007,-314.03,19.6465,-1599.67,1.0,5000,0.3,1
2,856.6932373046875,12.6395,-461.19,19.3474,-1742.94,1.0,10000,0.15,2
3,802.3172607421875,12.5083,-349.06,19.0794,-1506.14,1.0,15000,0.05,3
4,723.4979858398438,12.0401,-387.5,18.6684,-1694.35,1.0,20000,0.0,4
5,633.3189086914062,11.3104,-377.76,18.2413,-1785.12,1.0,25000,0.0,5
6,627.3408813476562,11.1857,-376.24,18.3548,-1635.36,0.9,30000,0.0,6
7,582.3284912109375,11.0493,-371.55,18.0634,-1532.3,1.0,35000,0.0,7
8,563.918701171875,10.896,-416.91,18.4205,-1582.57,1.0,40000,0.0,8
9,519.3582763671875,10.5813,-469.21,17.9368,-1453.23,1.0,45000,0.0,9
10,540.8156127929688,10.5612,-488.1,18.3423,-1727.6,1.0,50000,0.0,10
11,491.9237976074219,10.4228,-455.0,17.9904,-1564.99,1.0,55000,0.0,11
12,491.2100524902344,10.568,-471.35,17.915,-1774.1,1.0,60000,0.0,12
13,450.4280090332031,10.1315,-436.92,17.6431,-1604.12,1.0,65000,0.0,13
14,418.89617919921875,10.1336,-453.25,18.0428,-1601.51,0.95,70000,0.0,14
15,408.1478576660156,9.7777,-470.92,17.9716,-1683.89,1.0,75000,0.0,15
16,394.7976379394531,9.6576,-338.98,17.4801,-1578.19,1.0,80000,0.0,16
17,354.7752990722656,9.6939,-318.64,17.4812,-1203.13,1.0,85000,0.0,17
18,331.2891845703125,9.4649,-415.97,17.6668,-1320.83,1.0,90000,0.0,18
19,308.65435791015625,9.4973,-382.98,17.1333,-1499.21,1.0,95000,0.0,19
20,306.5234680175781,9.4129,-427.75,17.6589,-1592.14,1.0,100000,0.0,20
21,281.3668518066406,9.3717,-430.65,17.371,-1481.19,0.95,105000,0.0,21
22,277.67669677734375,9.2699,-404.1,17.5713,-1374.04,1.0,110000,0.0,22
23,253.5480194091797,8.7263,-291.38,17.2453,-1442.01,1.0,115000,0.0,23
24,248.78598022460938,9.1972,-403.59,17.6744,-1657.37,1.0,120000,0.0,24
25,235.5999298095703,8.9869,-407.31,17.3458,-1409.22,1.0,125000,0.0,25
26,223.51670837402344,9.0863,-387.68,17.1723,-1286.68,1.0,130000,0.0,26
27,197.36570739746094,8.7153,-302.07,17.0459,-1243.69,1.0,135000,0.0,27
28,193.90696716308594,8.5505,-325.6,16.5885,-1456.62,1.0,140000,0.0,28
29,167.47837829589844,8.1507,-303.97,16.8289,-1219.93,1.0,145000,0.0,29
30,177.5477294921875,8.587,-338.29,17.1979,-1075.64,1.0,150000,0.0,30
31,149.12509155273438,8.5569,-275.92,16.9873,-1263.93,0.95,155000,0.0,31
32,146.6197052001953,8.5517,-347.53,16.6335,-1262.53,1.0,160000,0.0,32
33,144.4752197265625,8.3522,-231.19,16.7434,-1347.82,1.0,165000,0.0,33
34,125.18263244628906,8.3948,-293.57,16.7813,-1124.2,1.0,170000,0.0,34
35,123.6574935913086,8.3433,-282.81,16.4674,-1355.86,1.0,175000,0.0,35
36,114.66106414794922,8.0832,-343.4,16.373,-1318.65,0.95,180000,0.0,36
37,115.59593963623047,8.3115,-314.83,16.556,-1252.24,1.0,185000,0.0,37
38,108.87354278564453,8.2053,-341.25,16.6576,-1252.92,1.0,190000,0.0,38
