Logging to logs/HalfCheetah-v3/exp-1/maxentirl/2023_11_09_06_01_18
--2023-11-09 06:02:38.051157 CST--
| Itration            | 0        |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -106     |
| Running Env Steps   | 0        |
| Running Forward KL  | 16       |
| Running Reverse KL  | 10.3     |
| Running Update Time | 0        |
----------------------------------
--2023-11-09 06:04:01.409496 CST--
| Itration            | 1        |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -63.2    |
| Running Env Steps   | 5000     |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 1        |
----------------------------------
--2023-11-09 06:05:31.959857 CST--
| Itration            | 2        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -49.1    |
| Running Env Steps   | 10000    |
| Running Forward KL  | 14.4     |
| Running Reverse KL  | 12       |
| Running Update Time | 2        |
----------------------------------
--2023-11-09 06:07:02.854977 CST--
| Itration            | 3        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -47.8    |
| Running Env Steps   | 15000    |
| Running Forward KL  | 13.9     |
| Running Reverse KL  | 12       |
| Running Update Time | 3        |
----------------------------------
--2023-11-09 06:08:33.388246 CST--
| Itration            | 4        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -57      |
| Running Env Steps   | 20000    |
| Running Forward KL  | 14.3     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 4        |
----------------------------------
--2023-11-09 06:10:03.703698 CST--
| Itration            | 5        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -66.1    |
| Running Env Steps   | 25000    |
| Running Forward KL  | 14.2     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 5        |
----------------------------------
--2023-11-09 06:11:34.250751 CST--
| Itration            | 6        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -84      |
| Running Env Steps   | 30000    |
| Running Forward KL  | 13.6     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 6        |
----------------------------------
--2023-11-09 06:13:04.871319 CST--
| Itration            | 7        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -91.5    |
| Running Env Steps   | 35000    |
| Running Forward KL  | 13.7     |
| Running Reverse KL  | 12       |
| Running Update Time | 7        |
----------------------------------
--2023-11-09 06:14:35.564726 CST--
| Itration            | 8        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.9e+03  |
| Real Sto violation  | 0.1      |
| Reward Loss         | -116     |
| Running Env Steps   | 40000    |
| Running Forward KL  | 14.2     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 8        |
----------------------------------
--2023-11-09 06:16:06.304207 CST--
| Itration            | 9        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.91e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -127     |
| Running Env Steps   | 45000    |
| Running Forward KL  | 13.7     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 9        |
----------------------------------
--2023-11-09 06:17:38.308582 CST--
| Itration            | 10       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.9e+03  |
| Real Sto violation  | 0.15     |
| Reward Loss         | -142     |
| Running Env Steps   | 50000    |
| Running Forward KL  | 13.5     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 10       |
----------------------------------
--2023-11-09 06:19:11.538868 CST--
| Itration            | 11       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.91e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -150     |
| Running Env Steps   | 55000    |
| Running Forward KL  | 13.4     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 11       |
----------------------------------
--2023-11-09 06:20:46.100706 CST--
| Itration            | 12       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.91e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -164     |
| Running Env Steps   | 60000    |
| Running Forward KL  | 14       |
| Running Reverse KL  | 11.8     |
| Running Update Time | 12       |
----------------------------------
--2023-11-09 06:22:14.751653 CST--
| Itration            | 13       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -172     |
| Running Env Steps   | 65000    |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 13       |
----------------------------------
--2023-11-09 06:23:47.194003 CST--
| Itration            | 14       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -191     |
| Running Env Steps   | 70000    |
| Running Forward KL  | 13.5     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 14       |
----------------------------------
--2023-11-09 06:25:25.173135 CST--
| Itration            | 15       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -199     |
| Running Env Steps   | 75000    |
| Running Forward KL  | 13.4     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 15       |
----------------------------------
--2023-11-09 06:27:05.654750 CST--
| Itration            | 16       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -217     |
| Running Env Steps   | 80000    |
| Running Forward KL  | 13.1     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 16       |
----------------------------------
--2023-11-09 06:28:46.971361 CST--
| Itration            | 17       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -226     |
| Running Env Steps   | 85000    |
| Running Forward KL  | 13.1     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 17       |
----------------------------------
--2023-11-09 06:30:28.491878 CST--
| Itration            | 18       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -232     |
| Running Env Steps   | 90000    |
| Running Forward KL  | 13.2     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 18       |
----------------------------------
--2023-11-09 06:32:10.533775 CST--
| Itration            | 19       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -247     |
| Running Env Steps   | 95000    |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 11       |
| Running Update Time | 19       |
----------------------------------
--2023-11-09 06:33:53.045842 CST--
| Itration            | 20       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -249     |
| Running Env Steps   | 100000   |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 20       |
----------------------------------
--2023-11-09 06:35:35.927363 CST--
| Itration            | 21       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.95e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -262     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 21       |
----------------------------------
--2023-11-09 06:37:19.610847 CST--
| Itration            | 22       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -274     |
| Running Env Steps   | 110000   |
| Running Forward KL  | 12.5     |
| Running Reverse KL  | 11       |
| Running Update Time | 22       |
----------------------------------
--2023-11-09 06:39:04.095402 CST--
| Itration            | 23       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -291     |
| Running Env Steps   | 115000   |
| Running Forward KL  | 12.5     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 23       |
----------------------------------
--2023-11-09 06:40:49.026112 CST--
| Itration            | 24       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -296     |
| Running Env Steps   | 120000   |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 24       |
----------------------------------
--2023-11-09 06:42:34.297772 CST--
| Itration            | 25       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.95e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -303     |
| Running Env Steps   | 125000   |
| Running Forward KL  | 12.2     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 25       |
----------------------------------
--2023-11-09 06:44:20.677303 CST--
| Itration            | 26       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.96e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -315     |
| Running Env Steps   | 130000   |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 26       |
----------------------------------
--2023-11-09 06:46:08.019573 CST--
| Itration            | 27       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -318     |
| Running Env Steps   | 135000   |
| Running Forward KL  | 12.3     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 27       |
----------------------------------
--2023-11-09 06:47:56.037584 CST--
| Itration            | 28       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.96e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -335     |
| Running Env Steps   | 140000   |
| Running Forward KL  | 12.2     |
| Running Reverse KL  | 10.4     |
| Running Update Time | 28       |
----------------------------------
--2023-11-09 06:49:43.593679 CST--
| Itration            | 29       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -341     |
| Running Env Steps   | 145000   |
| Running Forward KL  | 12       |
| Running Reverse KL  | 10.2     |
| Running Update Time | 29       |
----------------------------------
--2023-11-09 06:51:32.008425 CST--
| Itration            | 30       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.99e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -354     |
| Running Env Steps   | 150000   |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 30       |
----------------------------------
--2023-11-09 06:53:21.476265 CST--
| Itration            | 31       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -356     |
| Running Env Steps   | 155000   |
| Running Forward KL  | 11.8     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 31       |
----------------------------------
--2023-11-09 06:55:11.110985 CST--
| Itration            | 32       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.98e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -372     |
| Running Env Steps   | 160000   |
| Running Forward KL  | 12.6     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 32       |
----------------------------------
--2023-11-09 06:57:01.100912 CST--
| Itration            | 33       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2e+03    |
| Real Sto violation  | 0.25     |
| Reward Loss         | -374     |
| Running Env Steps   | 165000   |
| Running Forward KL  | 12.2     |
| Running Reverse KL  | 9.99     |
| Running Update Time | 33       |
----------------------------------
--2023-11-09 07:27:57.318329 CST--
| Itration            | 34       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.99e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -373     |
| Running Env Steps   | 170000   |
| Running Forward KL  | 11.5     |
| Running Reverse KL  | 9.89     |
| Running Update Time | 34       |
----------------------------------
--2023-11-09 07:29:49.433381 CST--
| Itration            | 35       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2e+03    |
| Real Sto violation  | 0.2      |
| Reward Loss         | -384     |
| Running Env Steps   | 175000   |
| Running Forward KL  | 12.1     |
| Running Reverse KL  | 9.87     |
| Running Update Time | 35       |
----------------------------------
--2023-11-09 07:31:42.075061 CST--
| Itration            | 36       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -395     |
| Running Env Steps   | 180000   |
| Running Forward KL  | 11.2     |
| Running Reverse KL  | 9.89     |
| Running Update Time | 36       |
----------------------------------
--2023-11-09 07:33:35.557983 CST--
| Itration            | 37       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -400     |
| Running Env Steps   | 185000   |
| Running Forward KL  | 11.3     |
| Running Reverse KL  | 9.77     |
| Running Update Time | 37       |
----------------------------------
--2023-11-09 07:35:30.178676 CST--
| Itration            | 38       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2e+03    |
| Real Sto violation  | 0.2      |
| Reward Loss         | -408     |
| Running Env Steps   | 190000   |
| Running Forward KL  | 12       |
| Running Reverse KL  | 9.82     |
| Running Update Time | 38       |
----------------------------------
--2023-11-09 07:37:25.243924 CST--
| Itration            | 39       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -405     |
| Running Env Steps   | 195000   |
| Running Forward KL  | 11.4     |
| Running Reverse KL  | 9.65     |
| Running Update Time | 39       |
----------------------------------
--2023-11-09 07:39:20.913331 CST--
| Itration            | 40       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.05e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -409     |
| Running Env Steps   | 200000   |
| Running Forward KL  | 11.4     |
| Running Reverse KL  | 9.41     |
| Running Update Time | 40       |
----------------------------------
--2023-11-09 07:41:14.620462 CST--
| Itration            | 41       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.05e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -420     |
| Running Env Steps   | 205000   |
| Running Forward KL  | 10.9     |
| Running Reverse KL  | 9.42     |
| Running Update Time | 41       |
----------------------------------
--2023-11-09 07:43:08.054015 CST--
| Itration            | 42       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -417     |
| Running Env Steps   | 210000   |
| Running Forward KL  | 11.1     |
| Running Reverse KL  | 9.3      |
| Running Update Time | 42       |
----------------------------------
--2023-11-09 07:45:01.555391 CST--
| Itration            | 43       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -422     |
| Running Env Steps   | 215000   |
| Running Forward KL  | 11       |
| Running Reverse KL  | 9.14     |
| Running Update Time | 43       |
----------------------------------
--2023-11-09 07:46:55.141610 CST--
| Itration            | 44       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -431     |
| Running Env Steps   | 220000   |
| Running Forward KL  | 10.9     |
| Running Reverse KL  | 9.29     |
| Running Update Time | 44       |
----------------------------------
--2023-11-09 07:48:47.413664 CST--
| Itration            | 45       |
| Real Det Return     | 1.9e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.1e+03  |
| Real Sto violation  | 0.3      |
| Reward Loss         | -416     |
| Running Env Steps   | 225000   |
| Running Forward KL  | 10.8     |
| Running Reverse KL  | 8.93     |
| Running Update Time | 45       |
----------------------------------
--2023-11-09 07:50:39.456507 CST--
| Itration            | 46       |
| Real Det Return     | 1.89e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -414     |
| Running Env Steps   | 230000   |
| Running Forward KL  | 10.8     |
| Running Reverse KL  | 8.89     |
| Running Update Time | 46       |
----------------------------------
--2023-11-09 07:52:31.381986 CST--
| Itration            | 47       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.12e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -417     |
| Running Env Steps   | 235000   |
| Running Forward KL  | 10.5     |
| Running Reverse KL  | 8.88     |
| Running Update Time | 47       |
----------------------------------
--2023-11-09 07:54:23.778231 CST--
| Itration            | 48       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | -427     |
| Running Env Steps   | 240000   |
| Running Forward KL  | 10.8     |
| Running Reverse KL  | 9.02     |
| Running Update Time | 48       |
----------------------------------
--2023-11-09 07:56:16.078092 CST--
| Itration            | 49       |
| Real Det Return     | 2.31e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -414     |
| Running Env Steps   | 245000   |
| Running Forward KL  | 10.3     |
| Running Reverse KL  | 8.71     |
| Running Update Time | 49       |
----------------------------------
--2023-11-09 07:58:08.723874 CST--
| Itration            | 50       |
| Real Det Return     | 2.24e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -409     |
| Running Env Steps   | 250000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 8.42     |
| Running Update Time | 50       |
----------------------------------
--2023-11-09 08:00:01.593096 CST--
| Itration            | 51       |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -403     |
| Running Env Steps   | 255000   |
| Running Forward KL  | 10.5     |
| Running Reverse KL  | 8.6      |
| Running Update Time | 51       |
----------------------------------
--2023-11-09 08:01:54.679099 CST--
| Itration            | 52       |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.22e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -407     |
| Running Env Steps   | 260000   |
| Running Forward KL  | 9.76     |
| Running Reverse KL  | 8.46     |
| Running Update Time | 52       |
----------------------------------
--2023-11-09 08:03:49.066706 CST--
| Itration            | 53       |
| Real Det Return     | 2.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | -393     |
| Running Env Steps   | 265000   |
| Running Forward KL  | 10.3     |
| Running Reverse KL  | 8.41     |
| Running Update Time | 53       |
----------------------------------
--2023-11-09 08:05:42.881173 CST--
| Itration            | 54       |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -403     |
| Running Env Steps   | 270000   |
| Running Forward KL  | 10.2     |
| Running Reverse KL  | 8.03     |
| Running Update Time | 54       |
----------------------------------
--2023-11-09 08:07:36.754892 CST--
| Itration            | 55       |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.21e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -394     |
| Running Env Steps   | 275000   |
| Running Forward KL  | 9.99     |
| Running Reverse KL  | 8.38     |
| Running Update Time | 55       |
----------------------------------
--2023-11-09 08:09:30.685878 CST--
| Itration            | 56       |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -383     |
| Running Env Steps   | 280000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 8.14     |
| Running Update Time | 56       |
----------------------------------
--2023-11-09 08:11:24.929494 CST--
| Itration            | 57       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -389     |
| Running Env Steps   | 285000   |
| Running Forward KL  | 9.67     |
| Running Reverse KL  | 8.25     |
| Running Update Time | 57       |
----------------------------------
--2023-11-09 08:13:19.574094 CST--
| Itration            | 58       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -392     |
| Running Env Steps   | 290000   |
| Running Forward KL  | 9.78     |
| Running Reverse KL  | 8.44     |
| Running Update Time | 58       |
----------------------------------
--2023-11-09 08:15:14.455149 CST--
| Itration            | 59       |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -391     |
| Running Env Steps   | 295000   |
| Running Forward KL  | 9.83     |
| Running Reverse KL  | 8.37     |
| Running Update Time | 59       |
----------------------------------
--2023-11-09 08:17:08.513450 CST--
| Itration            | 60       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -373     |
| Running Env Steps   | 300000   |
| Running Forward KL  | 10       |
| Running Reverse KL  | 8.27     |
| Running Update Time | 60       |
----------------------------------
--2023-11-09 08:19:02.769812 CST--
| Itration            | 61       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -390     |
| Running Env Steps   | 305000   |
| Running Forward KL  | 9.87     |
| Running Reverse KL  | 8.1      |
| Running Update Time | 61       |
----------------------------------
--2023-11-09 08:20:57.586660 CST--
| Itration            | 62       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0.85     |
| Reward Loss         | -395     |
| Running Env Steps   | 310000   |
| Running Forward KL  | 9.93     |
| Running Reverse KL  | 8.18     |
| Running Update Time | 62       |
----------------------------------
--2023-11-09 08:22:52.707049 CST--
| Itration            | 63       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -389     |
| Running Env Steps   | 315000   |
| Running Forward KL  | 9.6      |
| Running Reverse KL  | 7.88     |
| Running Update Time | 63       |
----------------------------------
--2023-11-09 08:24:47.693084 CST--
| Itration            | 64       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -376     |
| Running Env Steps   | 320000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.99     |
| Running Update Time | 64       |
----------------------------------
--2023-11-09 08:26:43.099261 CST--
| Itration            | 65       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -386     |
| Running Env Steps   | 325000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.98     |
| Running Update Time | 65       |
----------------------------------
--2023-11-09 08:28:36.649317 CST--
| Itration            | 66       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -365     |
| Running Env Steps   | 330000   |
| Running Forward KL  | 9.94     |
| Running Reverse KL  | 7.92     |
| Running Update Time | 66       |
----------------------------------
--2023-11-09 08:30:35.479435 CST--
| Itration            | 67       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -384     |
| Running Env Steps   | 335000   |
| Running Forward KL  | 9.31     |
| Running Reverse KL  | 7.93     |
| Running Update Time | 67       |
----------------------------------
--2023-11-09 08:32:32.140085 CST--
| Itration            | 68       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -379     |
| Running Env Steps   | 340000   |
| Running Forward KL  | 9.71     |
| Running Reverse KL  | 8.03     |
| Running Update Time | 68       |
----------------------------------
--2023-11-09 08:34:29.928150 CST--
| Itration            | 69       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.65     |
| Reward Loss         | -361     |
| Running Env Steps   | 345000   |
| Running Forward KL  | 9.49     |
| Running Reverse KL  | 7.94     |
| Running Update Time | 69       |
----------------------------------
--2023-11-09 08:36:27.515060 CST--
| Itration            | 70       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -382     |
| Running Env Steps   | 350000   |
| Running Forward KL  | 9.37     |
| Running Reverse KL  | 7.85     |
| Running Update Time | 70       |
----------------------------------
--2023-11-09 08:38:25.211941 CST--
| Itration            | 71       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -397     |
| Running Env Steps   | 355000   |
| Running Forward KL  | 9.5      |
| Running Reverse KL  | 7.65     |
| Running Update Time | 71       |
----------------------------------
--2023-11-09 08:40:22.935995 CST--
| Itration            | 72       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -376     |
| Running Env Steps   | 360000   |
| Running Forward KL  | 9.53     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 72       |
----------------------------------
--2023-11-09 08:42:20.591237 CST--
| Itration            | 73       |
| Real Det Return     | 2.81e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.85     |
| Reward Loss         | -386     |
| Running Env Steps   | 365000   |
| Running Forward KL  | 9.48     |
| Running Reverse KL  | 7.64     |
| Running Update Time | 73       |
----------------------------------
--2023-11-09 08:44:18.912111 CST--
| Itration            | 74       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -389     |
| Running Env Steps   | 370000   |
| Running Forward KL  | 9.09     |
| Running Reverse KL  | 7.71     |
| Running Update Time | 74       |
----------------------------------
--2023-11-09 08:46:16.842774 CST--
| Itration            | 75       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -385     |
| Running Env Steps   | 375000   |
| Running Forward KL  | 9.51     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 75       |
----------------------------------
