Logging to logs/Walker2d-v3/exp-1/maxentirl_sa/2023_11_10_06_54_01
--2023-11-10 06:55:15.293829 CST--
| Itration            | 0        |
| Real Det Return     | 61.4     |
| Real Det violation  | 0        |
| Real Sto Return     | 122      |
| Real Sto violation  | 0.35     |
| Reward Loss         | 109      |
| Running Env Steps   | 0        |
| Running Forward KL  | 28.3     |
| Running Reverse KL  | 14.4     |
| Running Update Time | 0        |
----------------------------------
--2023-11-10 06:56:46.467016 CST--
| Itration            | 1        |
| Real Det Return     | 102      |
| Real Det violation  | 0.55     |
| Real Sto Return     | 180      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 149      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 28.6     |
| Running Reverse KL  | 15.7     |
| Running Update Time | 1        |
----------------------------------
--2023-11-10 06:58:17.300529 CST--
| Itration            | 2        |
| Real Det Return     | 94.2     |
| Real Det violation  | 0.15     |
| Real Sto Return     | 147      |
| Real Sto violation  | 0.35     |
| Reward Loss         | 128      |
| Running Env Steps   | 10000    |
| Running Forward KL  | 29.1     |
| Running Reverse KL  | 16.3     |
| Running Update Time | 2        |
----------------------------------
--2023-11-10 06:59:47.654756 CST--
| Itration            | 3        |
| Real Det Return     | 111      |
| Real Det violation  | 0        |
| Real Sto Return     | 185      |
| Real Sto violation  | 0.4      |
| Reward Loss         | 129      |
| Running Env Steps   | 15000    |
| Running Forward KL  | 28.9     |
| Running Reverse KL  | 16.5     |
| Running Update Time | 3        |
----------------------------------
--2023-11-10 07:01:18.630758 CST--
| Itration            | 4        |
| Real Det Return     | 187      |
| Real Det violation  | 1        |
| Real Sto Return     | 162      |
| Real Sto violation  | 0.65     |
| Reward Loss         | 178      |
| Running Env Steps   | 20000    |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 16.7     |
| Running Update Time | 4        |
----------------------------------
--2023-11-10 07:02:49.929791 CST--
| Itration            | 5        |
| Real Det Return     | 167      |
| Real Det violation  | 1        |
| Real Sto Return     | 219      |
| Real Sto violation  | 0.35     |
| Reward Loss         | 148      |
| Running Env Steps   | 25000    |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 5        |
----------------------------------
--2023-11-10 07:04:22.259302 CST--
| Itration            | 6        |
| Real Det Return     | 163      |
| Real Det violation  | 1        |
| Real Sto Return     | 284      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 112      |
| Running Env Steps   | 30000    |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 16.3     |
| Running Update Time | 6        |
----------------------------------
--2023-11-10 07:05:58.422281 CST--
| Itration            | 7        |
| Real Det Return     | 493      |
| Real Det violation  | 0.95     |
| Real Sto Return     | 340      |
| Real Sto violation  | 0.65     |
| Reward Loss         | 41.5     |
| Running Env Steps   | 35000    |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 17.1     |
| Running Update Time | 7        |
----------------------------------
--2023-11-10 07:07:34.918256 CST--
| Itration            | 8        |
| Real Det Return     | 516      |
| Real Det violation  | 0.95     |
| Real Sto Return     | 291      |
| Real Sto violation  | 0.9      |
| Reward Loss         | 46.7     |
| Running Env Steps   | 40000    |
| Running Forward KL  | 28       |
| Running Reverse KL  | 15.1     |
| Running Update Time | 8        |
----------------------------------
--2023-11-10 07:09:26.382690 CST--
| Itration            | 9        |
| Real Det Return     | 2.34e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 557      |
| Real Sto violation  | 0.9      |
| Reward Loss         | -2.62    |
| Running Env Steps   | 45000    |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 24.9     |
| Running Update Time | 9        |
----------------------------------
--2023-11-10 07:11:17.319190 CST--
| Itration            | 10       |
| Real Det Return     | 2.42e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 597      |
| Real Sto violation  | 0.85     |
| Reward Loss         | 47.6     |
| Running Env Steps   | 50000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 14.6     |
| Running Update Time | 10       |
----------------------------------
--2023-11-10 07:13:00.374745 CST--
| Itration            | 11       |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 1        |
| Real Sto Return     | 639      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 61.1     |
| Running Env Steps   | 55000    |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 15.9     |
| Running Update Time | 11       |
----------------------------------
--2023-11-10 07:14:44.548194 CST--
| Itration            | 12       |
| Real Det Return     | 1.09e+03 |
| Real Det violation  | 1        |
| Real Sto Return     | 510      |
| Real Sto violation  | 0.85     |
| Reward Loss         | 81.7     |
| Running Env Steps   | 60000    |
| Running Forward KL  | 28.5     |
| Running Reverse KL  | 16.8     |
| Running Update Time | 12       |
----------------------------------
--2023-11-10 07:16:41.972832 CST--
| Itration            | 13       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 908      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 80.2     |
| Running Env Steps   | 65000    |
| Running Forward KL  | 29       |
| Running Reverse KL  | 14.9     |
| Running Update Time | 13       |
----------------------------------
--2023-11-10 07:18:39.873775 CST--
| Itration            | 14       |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 758      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 61.5     |
| Running Env Steps   | 70000    |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 13.8     |
| Running Update Time | 14       |
----------------------------------
--2023-11-10 07:20:28.575200 CST--
| Itration            | 15       |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 1        |
| Real Sto Return     | 683      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 43.7     |
| Running Env Steps   | 75000    |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 15       |
----------------------------------
--2023-11-10 07:22:14.915092 CST--
| Itration            | 16       |
| Real Det Return     | 583      |
| Real Det violation  | 1        |
| Real Sto Return     | 628      |
| Real Sto violation  | 0.6      |
| Reward Loss         | 70.3     |
| Running Env Steps   | 80000    |
| Running Forward KL  | 28.2     |
| Running Reverse KL  | 14.4     |
| Running Update Time | 16       |
----------------------------------
--2023-11-10 07:24:15.689260 CST--
| Itration            | 17       |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 986      |
| Real Sto violation  | 0.75     |
| Reward Loss         | 64.3     |
| Running Env Steps   | 85000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 14.4     |
| Running Update Time | 17       |
----------------------------------
--2023-11-10 07:26:11.114388 CST--
| Itration            | 18       |
| Real Det Return     | 1.66e+03 |
| Real Det violation  | 0.4      |
| Real Sto Return     | 777      |
| Real Sto violation  | 0.75     |
| Reward Loss         | 28.7     |
| Running Env Steps   | 90000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 18       |
----------------------------------
--2023-11-10 07:28:09.939494 CST--
| Itration            | 19       |
| Real Det Return     | 1.61e+03 |
| Real Det violation  | 0.25     |
| Real Sto Return     | 952      |
| Real Sto violation  | 0.5      |
| Reward Loss         | 24.9     |
| Running Env Steps   | 95000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 19       |
----------------------------------
--2023-11-10 07:30:07.520324 CST--
| Itration            | 20       |
| Real Det Return     | 1.56e+03 |
| Real Det violation  | 0.5      |
| Real Sto Return     | 1.06e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | 19       |
| Running Env Steps   | 100000   |
| Running Forward KL  | 28       |
| Running Reverse KL  | 14.6     |
| Running Update Time | 20       |
----------------------------------
--2023-11-10 07:32:11.913071 CST--
| Itration            | 21       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.17e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | 12.3     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 28       |
| Running Reverse KL  | 14.7     |
| Running Update Time | 21       |
----------------------------------
--2023-11-10 07:34:07.415319 CST--
| Itration            | 22       |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 0.85     |
| Real Sto Return     | 1.12e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | 11       |
| Running Env Steps   | 110000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 22       |
----------------------------------
--2023-11-10 07:36:13.747068 CST--
| Itration            | 23       |
| Real Det Return     | 1.92e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.58e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | 40.4     |
| Running Env Steps   | 115000   |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 16       |
| Running Update Time | 23       |
----------------------------------
--2023-11-10 07:38:21.193191 CST--
| Itration            | 24       |
| Real Det Return     | 2.21e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | 4.77     |
| Running Env Steps   | 120000   |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 15       |
| Running Update Time | 24       |
----------------------------------
--2023-11-10 07:40:28.098739 CST--
| Itration            | 25       |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | 9.08     |
| Running Env Steps   | 125000   |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 15.9     |
| Running Update Time | 25       |
----------------------------------
--2023-11-10 07:42:31.377416 CST--
| Itration            | 26       |
| Real Det Return     | 1.83e+03 |
| Real Det violation  | 0.3      |
| Real Sto Return     | 1.68e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -13.6    |
| Running Env Steps   | 130000   |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 26       |
----------------------------------
--2023-11-10 07:44:41.019330 CST--
| Itration            | 27       |
| Real Det Return     | 2.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.87e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -27.3    |
| Running Env Steps   | 135000   |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 15.6     |
| Running Update Time | 27       |
----------------------------------
--2023-11-10 07:46:48.117351 CST--
| Itration            | 28       |
| Real Det Return     | 2.23e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.48e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | 1.09     |
| Running Env Steps   | 140000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15.7     |
| Running Update Time | 28       |
----------------------------------
--2023-11-10 07:48:58.172854 CST--
| Itration            | 29       |
| Real Det Return     | 2.05e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.84e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -5.03    |
| Running Env Steps   | 145000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 15.8     |
| Running Update Time | 29       |
----------------------------------
--2023-11-10 07:51:05.912630 CST--
| Itration            | 30       |
| Real Det Return     | 2.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.84e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -15.8    |
| Running Env Steps   | 150000   |
| Running Forward KL  | 28.9     |
| Running Reverse KL  | 17       |
| Running Update Time | 30       |
----------------------------------
--2023-11-10 07:53:13.633666 CST--
| Itration            | 31       |
| Real Det Return     | 2e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 1.77e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -20.7    |
| Running Env Steps   | 155000   |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 16.5     |
| Running Update Time | 31       |
----------------------------------
--2023-11-10 07:55:23.250426 CST--
| Itration            | 32       |
| Real Det Return     | 2.2e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -36.7    |
| Running Env Steps   | 160000   |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 16.2     |
| Running Update Time | 32       |
----------------------------------
--2023-11-10 07:57:33.404864 CST--
| Itration            | 33       |
| Real Det Return     | 2.14e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -35.3    |
| Running Env Steps   | 165000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 16.6     |
| Running Update Time | 33       |
----------------------------------
--2023-11-10 07:59:41.123718 CST--
| Itration            | 34       |
| Real Det Return     | 2.16e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -51.7    |
| Running Env Steps   | 170000   |
| Running Forward KL  | 28       |
| Running Reverse KL  | 15.8     |
| Running Update Time | 34       |
----------------------------------
--2023-11-10 08:01:50.511980 CST--
| Itration            | 35       |
| Real Det Return     | 2.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.99e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -68.7    |
| Running Env Steps   | 175000   |
| Running Forward KL  | 28.6     |
| Running Reverse KL  | 16.5     |
| Running Update Time | 35       |
----------------------------------
--2023-11-10 08:03:59.061085 CST--
| Itration            | 36       |
| Real Det Return     | 2.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.98e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -80.1    |
| Running Env Steps   | 180000   |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 16.2     |
| Running Update Time | 36       |
----------------------------------
--2023-11-10 08:06:09.030115 CST--
| Itration            | 37       |
| Real Det Return     | 2.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -76.5    |
| Running Env Steps   | 185000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 16.4     |
| Running Update Time | 37       |
----------------------------------
--2023-11-10 08:08:18.008626 CST--
| Itration            | 38       |
| Real Det Return     | 2.2e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.14e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -89.6    |
| Running Env Steps   | 190000   |
| Running Forward KL  | 27.3     |
| Running Reverse KL  | 15.8     |
| Running Update Time | 38       |
----------------------------------
--2023-11-10 08:10:28.175766 CST--
| Itration            | 39       |
| Real Det Return     | 2.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -122     |
| Running Env Steps   | 195000   |
| Running Forward KL  | 27.3     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 39       |
----------------------------------
--2023-11-10 08:12:38.638665 CST--
| Itration            | 40       |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -102     |
| Running Env Steps   | 200000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 40       |
----------------------------------
--2023-11-10 08:14:48.874861 CST--
| Itration            | 41       |
| Real Det Return     | 2.23e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -124     |
| Running Env Steps   | 205000   |
| Running Forward KL  | 28.2     |
| Running Reverse KL  | 15.8     |
| Running Update Time | 41       |
----------------------------------
--2023-11-10 08:16:59.277463 CST--
| Itration            | 42       |
| Real Det Return     | 2.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.24e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -121     |
| Running Env Steps   | 210000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 15.8     |
| Running Update Time | 42       |
----------------------------------
--2023-11-10 08:19:09.277422 CST--
| Itration            | 43       |
| Real Det Return     | 2.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -136     |
| Running Env Steps   | 215000   |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 43       |
----------------------------------
--2023-11-10 08:21:20.412409 CST--
| Itration            | 44       |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.22e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -143     |
| Running Env Steps   | 220000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 44       |
----------------------------------
--2023-11-10 08:23:32.487416 CST--
| Itration            | 45       |
| Real Det Return     | 2.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -131     |
| Running Env Steps   | 225000   |
| Running Forward KL  | 26.9     |
| Running Reverse KL  | 15.9     |
| Running Update Time | 45       |
----------------------------------
--2023-11-10 08:25:48.542897 CST--
| Itration            | 46       |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -140     |
| Running Env Steps   | 230000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 46       |
----------------------------------
--2023-11-10 08:28:03.892864 CST--
| Itration            | 47       |
| Real Det Return     | 2.42e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -164     |
| Running Env Steps   | 235000   |
| Running Forward KL  | 27       |
| Running Reverse KL  | 14.7     |
| Running Update Time | 47       |
----------------------------------
--2023-11-10 08:30:18.801788 CST--
| Itration            | 48       |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -167     |
| Running Env Steps   | 240000   |
| Running Forward KL  | 27.3     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 48       |
----------------------------------
--2023-11-10 08:32:32.650236 CST--
| Itration            | 49       |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -193     |
| Running Env Steps   | 245000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 49       |
----------------------------------
--2023-11-10 08:34:46.213412 CST--
| Itration            | 50       |
| Real Det Return     | 2.29e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.24e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -184     |
| Running Env Steps   | 250000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 50       |
----------------------------------
--2023-11-10 08:36:59.882410 CST--
| Itration            | 51       |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -194     |
| Running Env Steps   | 255000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 51       |
----------------------------------
--2023-11-10 08:39:13.010520 CST--
| Itration            | 52       |
| Real Det Return     | 2.31e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -205     |
| Running Env Steps   | 260000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15.6     |
| Running Update Time | 52       |
----------------------------------
--2023-11-10 08:41:26.070188 CST--
| Itration            | 53       |
| Real Det Return     | 2.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -193     |
| Running Env Steps   | 265000   |
| Running Forward KL  | 26.4     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 53       |
----------------------------------
--2023-11-10 08:43:39.380376 CST--
| Itration            | 54       |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0.05     |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -207     |
| Running Env Steps   | 270000   |
| Running Forward KL  | 26.9     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 54       |
----------------------------------
--2023-11-10 08:45:52.801885 CST--
| Itration            | 55       |
| Real Det Return     | 2.38e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -216     |
| Running Env Steps   | 275000   |
| Running Forward KL  | 26.7     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 55       |
----------------------------------
--2023-11-10 08:47:53.734192 CST--
| Itration            | 56       |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0.05     |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -225     |
| Running Env Steps   | 280000   |
| Running Forward KL  | 26.7     |
| Running Reverse KL  | 15.1     |
| Running Update Time | 56       |
----------------------------------
--2023-11-10 08:49:54.704625 CST--
| Itration            | 57       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -218     |
| Running Env Steps   | 285000   |
| Running Forward KL  | 25.9     |
| Running Reverse KL  | 13.7     |
| Running Update Time | 57       |
----------------------------------
--2023-11-10 08:51:56.946094 CST--
| Itration            | 58       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -230     |
| Running Env Steps   | 290000   |
| Running Forward KL  | 26.6     |
| Running Reverse KL  | 14.4     |
| Running Update Time | 58       |
----------------------------------
--2023-11-10 08:53:58.487188 CST--
| Itration            | 59       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -248     |
| Running Env Steps   | 295000   |
| Running Forward KL  | 26.6     |
| Running Reverse KL  | 14.2     |
| Running Update Time | 59       |
----------------------------------
--2023-11-10 08:56:01.147338 CST--
| Itration            | 60       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -248     |
| Running Env Steps   | 300000   |
| Running Forward KL  | 26.8     |
| Running Reverse KL  | 14.5     |
| Running Update Time | 60       |
----------------------------------
--2023-11-10 08:58:03.554146 CST--
| Itration            | 61       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -248     |
| Running Env Steps   | 305000   |
| Running Forward KL  | 26.6     |
| Running Reverse KL  | 14.3     |
| Running Update Time | 61       |
----------------------------------
--2023-11-10 09:00:06.238445 CST--
| Itration            | 62       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -267     |
| Running Env Steps   | 310000   |
| Running Forward KL  | 26.3     |
| Running Reverse KL  | 13.8     |
| Running Update Time | 62       |
----------------------------------
--2023-11-10 09:02:09.063509 CST--
| Itration            | 63       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.44e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -256     |
| Running Env Steps   | 315000   |
| Running Forward KL  | 26       |
| Running Reverse KL  | 13.6     |
| Running Update Time | 63       |
----------------------------------
--2023-11-10 09:04:11.784639 CST--
| Itration            | 64       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -262     |
| Running Env Steps   | 320000   |
| Running Forward KL  | 26.1     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 64       |
----------------------------------
--2023-11-10 09:06:14.601456 CST--
| Itration            | 65       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -267     |
| Running Env Steps   | 325000   |
| Running Forward KL  | 26.3     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 65       |
----------------------------------
--2023-11-10 09:08:17.093007 CST--
| Itration            | 66       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.44e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -287     |
| Running Env Steps   | 330000   |
| Running Forward KL  | 26.4     |
| Running Reverse KL  | 14       |
| Running Update Time | 66       |
----------------------------------
--2023-11-10 09:10:19.496586 CST--
| Itration            | 67       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -273     |
| Running Env Steps   | 335000   |
| Running Forward KL  | 26.2     |
| Running Reverse KL  | 13.8     |
| Running Update Time | 67       |
----------------------------------
--2023-11-10 09:12:22.056945 CST--
| Itration            | 68       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -289     |
| Running Env Steps   | 340000   |
| Running Forward KL  | 26.2     |
| Running Reverse KL  | 13.5     |
| Running Update Time | 68       |
----------------------------------
--2023-11-10 09:14:24.396460 CST--
| Itration            | 69       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -299     |
| Running Env Steps   | 345000   |
| Running Forward KL  | 25.9     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 69       |
----------------------------------
--2023-11-10 09:16:27.319025 CST--
| Itration            | 70       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -301     |
| Running Env Steps   | 350000   |
| Running Forward KL  | 26       |
| Running Reverse KL  | 13.8     |
| Running Update Time | 70       |
----------------------------------
--2023-11-10 09:18:30.950707 CST--
| Itration            | 71       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -297     |
| Running Env Steps   | 355000   |
| Running Forward KL  | 25.8     |
| Running Reverse KL  | 13       |
| Running Update Time | 71       |
----------------------------------
--2023-11-10 09:20:35.030898 CST--
| Itration            | 72       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -299     |
| Running Env Steps   | 360000   |
| Running Forward KL  | 26       |
| Running Reverse KL  | 14       |
| Running Update Time | 72       |
----------------------------------
--2023-11-10 09:22:39.093477 CST--
| Itration            | 73       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -315     |
| Running Env Steps   | 365000   |
| Running Forward KL  | 25.6     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 73       |
----------------------------------
--2023-11-10 09:24:43.606237 CST--
| Itration            | 74       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.45e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -304     |
| Running Env Steps   | 370000   |
| Running Forward KL  | 25.5     |
| Running Reverse KL  | 13       |
| Running Update Time | 74       |
----------------------------------
--2023-11-10 09:26:48.286886 CST--
| Itration            | 75       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.48e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -329     |
| Running Env Steps   | 375000   |
| Running Forward KL  | 25.3     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 75       |
----------------------------------
--2023-11-10 09:28:52.974450 CST--
| Itration            | 76       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -326     |
| Running Env Steps   | 380000   |
| Running Forward KL  | 25.9     |
| Running Reverse KL  | 13.4     |
| Running Update Time | 76       |
----------------------------------
--2023-11-10 09:30:57.804258 CST--
| Itration            | 77       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.48e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -340     |
| Running Env Steps   | 385000   |
| Running Forward KL  | 25.3     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 77       |
----------------------------------
--2023-11-10 09:33:02.034803 CST--
| Itration            | 78       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -350     |
| Running Env Steps   | 390000   |
| Running Forward KL  | 25.5     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 78       |
----------------------------------
--2023-11-10 09:35:06.154379 CST--
| Itration            | 79       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -314     |
| Running Env Steps   | 395000   |
| Running Forward KL  | 25.3     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 79       |
----------------------------------
--2023-11-10 09:37:10.181433 CST--
| Itration            | 80       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.49e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -344     |
| Running Env Steps   | 400000   |
| Running Forward KL  | 25.5     |
| Running Reverse KL  | 13       |
| Running Update Time | 80       |
----------------------------------
--2023-11-10 09:39:14.074487 CST--
| Itration            | 81       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -347     |
| Running Env Steps   | 405000   |
| Running Forward KL  | 25.6     |
| Running Reverse KL  | 13       |
| Running Update Time | 81       |
----------------------------------
--2023-11-10 09:41:17.521664 CST--
| Itration            | 82       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -360     |
| Running Env Steps   | 410000   |
| Running Forward KL  | 25.5     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 82       |
----------------------------------
--2023-11-10 09:43:21.572953 CST--
| Itration            | 83       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -353     |
| Running Env Steps   | 415000   |
| Running Forward KL  | 25.4     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 83       |
----------------------------------
--2023-11-10 09:45:24.921837 CST--
| Itration            | 84       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -345     |
| Running Env Steps   | 420000   |
| Running Forward KL  | 24.8     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 84       |
----------------------------------
--2023-11-10 09:47:28.704786 CST--
| Itration            | 85       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -353     |
| Running Env Steps   | 425000   |
| Running Forward KL  | 25.3     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 85       |
----------------------------------
--2023-11-10 09:49:32.717354 CST--
| Itration            | 86       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -340     |
| Running Env Steps   | 430000   |
| Running Forward KL  | 25       |
| Running Reverse KL  | 13.2     |
| Running Update Time | 86       |
----------------------------------
--2023-11-10 09:51:37.035417 CST--
| Itration            | 87       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -363     |
| Running Env Steps   | 435000   |
| Running Forward KL  | 25.4     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 87       |
----------------------------------
--2023-11-10 09:53:39.853809 CST--
| Itration            | 88       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -377     |
| Running Env Steps   | 440000   |
| Running Forward KL  | 24.8     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 88       |
----------------------------------
--2023-11-10 09:55:44.366094 CST--
| Itration            | 89       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -375     |
| Running Env Steps   | 445000   |
| Running Forward KL  | 25.2     |
| Running Reverse KL  | 13       |
| Running Update Time | 89       |
----------------------------------
--2023-11-10 09:57:49.487992 CST--
| Itration            | 90       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -365     |
| Running Env Steps   | 450000   |
| Running Forward KL  | 24.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 90       |
----------------------------------
--2023-11-10 09:59:54.307267 CST--
| Itration            | 91       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -366     |
| Running Env Steps   | 455000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 91       |
----------------------------------
--2023-11-10 10:02:00.010708 CST--
| Itration            | 92       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -388     |
| Running Env Steps   | 460000   |
| Running Forward KL  | 25       |
| Running Reverse KL  | 13.1     |
| Running Update Time | 92       |
----------------------------------
--2023-11-10 10:04:06.040456 CST--
| Itration            | 93       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -381     |
| Running Env Steps   | 465000   |
| Running Forward KL  | 25.2     |
| Running Reverse KL  | 13       |
| Running Update Time | 93       |
----------------------------------
--2023-11-10 10:06:11.833097 CST--
| Itration            | 94       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -389     |
| Running Env Steps   | 470000   |
| Running Forward KL  | 25       |
| Running Reverse KL  | 13       |
| Running Update Time | 94       |
----------------------------------
--2023-11-10 10:08:17.760781 CST--
| Itration            | 95       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -389     |
| Running Env Steps   | 475000   |
| Running Forward KL  | 24.4     |
| Running Reverse KL  | 13       |
| Running Update Time | 95       |
----------------------------------
--2023-11-10 10:10:23.468263 CST--
| Itration            | 96       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -412     |
| Running Env Steps   | 480000   |
| Running Forward KL  | 25       |
| Running Reverse KL  | 12.9     |
| Running Update Time | 96       |
----------------------------------
--2023-11-10 10:12:29.536019 CST--
| Itration            | 97       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -398     |
| Running Env Steps   | 485000   |
| Running Forward KL  | 24.6     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 97       |
----------------------------------
--2023-11-10 10:14:34.857118 CST--
| Itration            | 98       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -417     |
| Running Env Steps   | 490000   |
| Running Forward KL  | 25.2     |
| Running Reverse KL  | 13       |
| Running Update Time | 98       |
----------------------------------
--2023-11-10 10:16:40.426568 CST--
| Itration            | 99       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.48e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -397     |
| Running Env Steps   | 495000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 99       |
----------------------------------
--2023-11-10 10:18:47.129684 CST--
| Itration            | 100      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -399     |
| Running Env Steps   | 500000   |
| Running Forward KL  | 24.7     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 100      |
----------------------------------
--2023-11-10 10:20:53.300599 CST--
| Itration            | 101      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.64e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -404     |
| Running Env Steps   | 505000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 12.8     |
| Running Update Time | 101      |
----------------------------------
--2023-11-10 10:23:00.219459 CST--
| Itration            | 102      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -407     |
| Running Env Steps   | 510000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 102      |
----------------------------------
--2023-11-10 10:25:07.383790 CST--
| Itration            | 103      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.6e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -421     |
| Running Env Steps   | 515000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 103      |
----------------------------------
--2023-11-10 10:27:14.748343 CST--
| Itration            | 104      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -424     |
| Running Env Steps   | 520000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 104      |
----------------------------------
--2023-11-10 10:29:21.888636 CST--
| Itration            | 105      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -431     |
| Running Env Steps   | 525000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 105      |
----------------------------------
--2023-11-10 10:31:29.031500 CST--
| Itration            | 106      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -442     |
| Running Env Steps   | 530000   |
| Running Forward KL  | 24.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 106      |
----------------------------------
--2023-11-10 10:33:36.702679 CST--
| Itration            | 107      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -437     |
| Running Env Steps   | 535000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 13       |
| Running Update Time | 107      |
----------------------------------
--2023-11-10 10:35:44.237233 CST--
| Itration            | 108      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -440     |
| Running Env Steps   | 540000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 108      |
----------------------------------
--2023-11-10 10:37:52.218458 CST--
| Itration            | 109      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -452     |
| Running Env Steps   | 545000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 13.3     |
| Running Update Time | 109      |
----------------------------------
--2023-11-10 10:39:59.582387 CST--
| Itration            | 110      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -455     |
| Running Env Steps   | 550000   |
| Running Forward KL  | 24.6     |
| Running Reverse KL  | 13       |
| Running Update Time | 110      |
----------------------------------
--2023-11-10 10:42:07.300578 CST--
| Itration            | 111      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -463     |
| Running Env Steps   | 555000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 111      |
----------------------------------
--2023-11-10 10:44:14.865532 CST--
| Itration            | 112      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.64e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -461     |
| Running Env Steps   | 560000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 112      |
----------------------------------
--2023-11-10 10:46:22.261292 CST--
| Itration            | 113      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -483     |
| Running Env Steps   | 565000   |
| Running Forward KL  | 25.1     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 113      |
----------------------------------
--2023-11-10 10:48:29.583667 CST--
| Itration            | 114      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.64e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -463     |
| Running Env Steps   | 570000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 13.1     |
| Running Update Time | 114      |
----------------------------------
--2023-11-10 10:50:36.569352 CST--
| Itration            | 115      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.64e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -477     |
| Running Env Steps   | 575000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 115      |
----------------------------------
--2023-11-10 10:52:43.066989 CST--
| Itration            | 116      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.65e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -473     |
| Running Env Steps   | 580000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 116      |
----------------------------------
--2023-11-10 10:54:49.507262 CST--
| Itration            | 117      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.62e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -477     |
| Running Env Steps   | 585000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 117      |
----------------------------------
--2023-11-10 10:56:54.403493 CST--
| Itration            | 118      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -486     |
| Running Env Steps   | 590000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 12.9     |
| Running Update Time | 118      |
----------------------------------
--2023-11-10 10:58:57.335453 CST--
| Itration            | 119      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -498     |
| Running Env Steps   | 595000   |
| Running Forward KL  | 23.7     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 119      |
----------------------------------
--2023-11-10 11:01:01.946785 CST--
| Itration            | 120      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.63e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -487     |
| Running Env Steps   | 600000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 120      |
----------------------------------
--2023-11-10 11:03:05.873922 CST--
| Itration            | 121      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -496     |
| Running Env Steps   | 605000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 13       |
| Running Update Time | 121      |
----------------------------------
--2023-11-10 11:05:13.715691 CST--
| Itration            | 122      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.65e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -506     |
| Running Env Steps   | 610000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 13       |
| Running Update Time | 122      |
----------------------------------
--2023-11-10 11:07:19.545724 CST--
| Itration            | 123      |
| Real Det Return     | 2.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.66e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -490     |
| Running Env Steps   | 615000   |
| Running Forward KL  | 24.1     |
| Running Reverse KL  | 13.4     |
| Running Update Time | 123      |
----------------------------------
--2023-11-10 11:09:25.777177 CST--
| Itration            | 124      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.67e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -513     |
| Running Env Steps   | 620000   |
| Running Forward KL  | 24.6     |
| Running Reverse KL  | 13       |
| Running Update Time | 124      |
----------------------------------
--2023-11-10 11:11:30.348008 CST--
| Itration            | 125      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -554     |
| Running Env Steps   | 625000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12       |
| Running Update Time | 125      |
----------------------------------
--2023-11-10 11:13:37.394507 CST--
| Itration            | 126      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.67e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -497     |
| Running Env Steps   | 630000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 126      |
----------------------------------
--2023-11-10 11:15:44.115964 CST--
| Itration            | 127      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.68e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -515     |
| Running Env Steps   | 635000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 13       |
| Running Update Time | 127      |
----------------------------------
--2023-11-10 11:17:51.011608 CST--
| Itration            | 128      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.66e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -537     |
| Running Env Steps   | 640000   |
| Running Forward KL  | 23.7     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 128      |
----------------------------------
--2023-11-10 11:19:56.253034 CST--
| Itration            | 129      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -515     |
| Running Env Steps   | 645000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 129      |
----------------------------------
--2023-11-10 11:22:02.209466 CST--
| Itration            | 130      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -531     |
| Running Env Steps   | 650000   |
| Running Forward KL  | 23.5     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 130      |
----------------------------------
--2023-11-10 11:24:09.197379 CST--
| Itration            | 131      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -540     |
| Running Env Steps   | 655000   |
| Running Forward KL  | 24.1     |
| Running Reverse KL  | 13       |
| Running Update Time | 131      |
----------------------------------
--2023-11-10 11:26:14.368318 CST--
| Itration            | 132      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.51e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -566     |
| Running Env Steps   | 660000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 132      |
----------------------------------
--2023-11-10 11:28:20.009785 CST--
| Itration            | 133      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -544     |
| Running Env Steps   | 665000   |
| Running Forward KL  | 24.4     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 133      |
----------------------------------
--2023-11-10 11:30:25.832194 CST--
| Itration            | 134      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.69e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -569     |
| Running Env Steps   | 670000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 13       |
| Running Update Time | 134      |
----------------------------------
--2023-11-10 11:32:28.419033 CST--
| Itration            | 135      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.12e+03 |
| Real Sto violation  | 0.45     |
| Reward Loss         | -608     |
| Running Env Steps   | 675000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 135      |
----------------------------------
--2023-11-10 11:34:33.473675 CST--
| Itration            | 136      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -622     |
| Running Env Steps   | 680000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 136      |
----------------------------------
--2023-11-10 11:36:34.966014 CST--
| Itration            | 137      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.9e+03  |
| Real Sto violation  | 0.55     |
| Reward Loss         | -662     |
| Running Env Steps   | 685000   |
| Running Forward KL  | 24.1     |
| Running Reverse KL  | 12       |
| Running Update Time | 137      |
----------------------------------
--2023-11-10 11:38:40.620000 CST--
| Itration            | 138      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -579     |
| Running Env Steps   | 690000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 138      |
----------------------------------
--2023-11-10 11:40:44.535708 CST--
| Itration            | 139      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -651     |
| Running Env Steps   | 695000   |
| Running Forward KL  | 24.1     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 139      |
----------------------------------
--2023-11-10 11:42:39.715103 CST--
| Itration            | 140      |
| Real Det Return     | 998      |
| Real Det violation  | 1        |
| Real Sto Return     | 1.06e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -762     |
| Running Env Steps   | 700000   |
| Running Forward KL  | 24.6     |
| Running Reverse KL  | 11       |
| Running Update Time | 140      |
----------------------------------
--2023-11-10 11:44:52.158812 CST--
| Itration            | 141      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -632     |
| Running Env Steps   | 705000   |
| Running Forward KL  | 24.4     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 141      |
----------------------------------
--2023-11-10 11:47:07.856755 CST--
| Itration            | 142      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.68e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -601     |
| Running Env Steps   | 710000   |
| Running Forward KL  | 24.1     |
| Running Reverse KL  | 13.4     |
| Running Update Time | 142      |
----------------------------------
--2023-11-10 11:49:22.092434 CST--
| Itration            | 143      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -610     |
| Running Env Steps   | 715000   |
| Running Forward KL  | 24.5     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 143      |
----------------------------------
--2023-11-10 11:51:35.460132 CST--
| Itration            | 144      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -611     |
| Running Env Steps   | 720000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 12.9     |
| Running Update Time | 144      |
----------------------------------
--2023-11-10 11:53:51.183505 CST--
| Itration            | 145      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.68e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -622     |
| Running Env Steps   | 725000   |
| Running Forward KL  | 24.2     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 145      |
----------------------------------
--2023-11-10 11:56:00.195906 CST--
| Itration            | 146      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.54e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -719     |
| Running Env Steps   | 730000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 11.2     |
| Running Update Time | 146      |
----------------------------------
--2023-11-10 11:58:16.026415 CST--
| Itration            | 147      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.69e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -659     |
| Running Env Steps   | 735000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 147      |
----------------------------------
--2023-11-10 12:00:31.390495 CST--
| Itration            | 148      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.68e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -647     |
| Running Env Steps   | 740000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 148      |
----------------------------------
--2023-11-10 12:02:46.049093 CST--
| Itration            | 149      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -634     |
| Running Env Steps   | 745000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 149      |
----------------------------------
--2023-11-10 12:04:59.181777 CST--
| Itration            | 150      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | -694     |
| Running Env Steps   | 750000   |
| Running Forward KL  | 23.6     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 150      |
----------------------------------
--2023-11-10 12:07:10.220666 CST--
| Itration            | 151      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -711     |
| Running Env Steps   | 755000   |
| Running Forward KL  | 24.3     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 151      |
----------------------------------
--2023-11-10 12:09:22.463482 CST--
| Itration            | 152      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -690     |
| Running Env Steps   | 760000   |
| Running Forward KL  | 23.7     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 152      |
----------------------------------
--2023-11-10 12:11:27.032561 CST--
| Itration            | 153      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -779     |
| Running Env Steps   | 765000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 153      |
----------------------------------
--2023-11-10 12:13:34.023227 CST--
| Itration            | 154      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -704     |
| Running Env Steps   | 770000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 154      |
----------------------------------
--2023-11-10 12:15:40.416894 CST--
| Itration            | 155      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -701     |
| Running Env Steps   | 775000   |
| Running Forward KL  | 23.6     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 155      |
----------------------------------
--2023-11-10 12:17:40.003829 CST--
| Itration            | 156      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.39e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -822     |
| Running Env Steps   | 780000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 156      |
----------------------------------
--2023-11-10 12:19:36.305450 CST--
| Itration            | 157      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -715     |
| Running Env Steps   | 785000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 157      |
----------------------------------
--2023-11-10 12:21:42.518578 CST--
| Itration            | 158      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -722     |
| Running Env Steps   | 790000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 12.6     |
| Running Update Time | 158      |
----------------------------------
--2023-11-10 12:23:50.059527 CST--
| Itration            | 159      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -736     |
| Running Env Steps   | 795000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 159      |
----------------------------------
--2023-11-10 12:25:53.734698 CST--
| Itration            | 160      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -864     |
| Running Env Steps   | 800000   |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 160      |
----------------------------------
--2023-11-10 12:27:56.458647 CST--
| Itration            | 161      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.75e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -803     |
| Running Env Steps   | 805000   |
| Running Forward KL  | 23.6     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 161      |
----------------------------------
--2023-11-10 12:30:02.909936 CST--
| Itration            | 162      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -846     |
| Running Env Steps   | 810000   |
| Running Forward KL  | 22.8     |
| Running Reverse KL  | 12       |
| Running Update Time | 162      |
----------------------------------
--2023-11-10 12:32:06.106301 CST--
| Itration            | 163      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.85e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -934     |
| Running Env Steps   | 815000   |
| Running Forward KL  | 23.2     |
| Running Reverse KL  | 12       |
| Running Update Time | 163      |
----------------------------------
--2023-11-10 12:34:13.629880 CST--
| Itration            | 164      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.68e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -716     |
| Running Env Steps   | 820000   |
| Running Forward KL  | 23.9     |
| Running Reverse KL  | 13.4     |
| Running Update Time | 164      |
----------------------------------
--2023-11-10 12:36:15.537811 CST--
| Itration            | 165      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.61e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -973     |
| Running Env Steps   | 825000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 11.8     |
| Running Update Time | 165      |
----------------------------------
--2023-11-10 12:38:23.494126 CST--
| Itration            | 166      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.7e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -735     |
| Running Env Steps   | 830000   |
| Running Forward KL  | 23.5     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 166      |
----------------------------------
--2023-11-10 12:40:31.341596 CST--
| Itration            | 167      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.7e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -789     |
| Running Env Steps   | 835000   |
| Running Forward KL  | 23.5     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 167      |
----------------------------------
--2023-11-10 12:42:36.127680 CST--
| Itration            | 168      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -777     |
| Running Env Steps   | 840000   |
| Running Forward KL  | 24       |
| Running Reverse KL  | 13.1     |
| Running Update Time | 168      |
----------------------------------
--2023-11-10 12:44:42.251419 CST--
| Itration            | 169      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | -852     |
| Running Env Steps   | 845000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 169      |
----------------------------------
--2023-11-10 12:46:47.984931 CST--
| Itration            | 170      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -823     |
| Running Env Steps   | 850000   |
| Running Forward KL  | 23.5     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 170      |
----------------------------------
--2023-11-10 12:48:53.594892 CST--
| Itration            | 171      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -836     |
| Running Env Steps   | 855000   |
| Running Forward KL  | 23.3     |
| Running Reverse KL  | 12       |
| Running Update Time | 171      |
----------------------------------
--2023-11-10 12:50:59.060235 CST--
| Itration            | 172      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 0.35     |
| Reward Loss         | -765     |
| Running Env Steps   | 860000   |
| Running Forward KL  | 23.6     |
| Running Reverse KL  | 13.4     |
| Running Update Time | 172      |
----------------------------------
--2023-11-10 12:53:07.190412 CST--
| Itration            | 173      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.72e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -807     |
| Running Env Steps   | 865000   |
| Running Forward KL  | 23.5     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 173      |
----------------------------------
--2023-11-10 12:55:11.869538 CST--
| Itration            | 174      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -861     |
| Running Env Steps   | 870000   |
| Running Forward KL  | 23.2     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 174      |
----------------------------------
--2023-11-10 12:57:18.476685 CST--
| Itration            | 175      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -858     |
| Running Env Steps   | 875000   |
| Running Forward KL  | 23.4     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 175      |
----------------------------------
--2023-11-10 12:59:25.322554 CST--
| Itration            | 176      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.25     |
| Reward Loss         | -799     |
| Running Env Steps   | 880000   |
| Running Forward KL  | 23.2     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 176      |
----------------------------------
--2023-11-10 13:01:30.901913 CST--
| Itration            | 177      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.13e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -890     |
| Running Env Steps   | 885000   |
| Running Forward KL  | 23.1     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 177      |
----------------------------------
--2023-11-10 13:03:39.005973 CST--
| Itration            | 178      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -848     |
| Running Env Steps   | 890000   |
| Running Forward KL  | 23.1     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 178      |
----------------------------------
--2023-11-10 13:05:43.096474 CST--
| Itration            | 179      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -849     |
| Running Env Steps   | 895000   |
| Running Forward KL  | 22.6     |
| Running Reverse KL  | 12       |
| Running Update Time | 179      |
----------------------------------
--2023-11-10 13:07:50.994899 CST--
| Itration            | 180      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.66e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -828     |
| Running Env Steps   | 900000   |
| Running Forward KL  | 22.9     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 180      |
----------------------------------
--2023-11-10 13:09:55.398930 CST--
| Itration            | 181      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -955     |
| Running Env Steps   | 905000   |
| Running Forward KL  | 22.8     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 181      |
----------------------------------
--2023-11-10 13:12:01.122235 CST--
| Itration            | 182      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.22e+03 |
| Real Sto violation  | 0.4      |
| Reward Loss         | -880     |
| Running Env Steps   | 910000   |
| Running Forward KL  | 22.1     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 182      |
----------------------------------
--2023-11-10 13:14:08.774475 CST--
| Itration            | 183      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.61e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -825     |
| Running Env Steps   | 915000   |
| Running Forward KL  | 22.3     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 183      |
----------------------------------
--2023-11-10 13:15:53.390222 CST--
| Itration            | 184      |
| Real Det Return     | 657      |
| Real Det violation  | 1        |
| Real Sto Return     | 639      |
| Real Sto violation  | 1        |
| Reward Loss         | -1.1e+03 |
| Running Env Steps   | 920000   |
| Running Forward KL  | 23.2     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 184      |
----------------------------------
--2023-11-10 13:17:58.133481 CST---
| Itration            | 185       |
| Real Det Return     | 2.71e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 2.06e+03  |
| Real Sto violation  | 0.5       |
| Reward Loss         | -1.02e+03 |
| Running Env Steps   | 925000    |
| Running Forward KL  | 22.6      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 185       |
-----------------------------------
--2023-11-10 13:20:08.026596 CST---
| Itration            | 186       |
| Real Det Return     | 2.7e+03   |
| Real Det violation  | 0         |
| Real Sto Return     | 1.53e+03  |
| Real Sto violation  | 0.8       |
| Reward Loss         | -1.01e+03 |
| Running Env Steps   | 930000    |
| Running Forward KL  | 21.9      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 186       |
-----------------------------------
--2023-11-10 13:22:17.676704 CST--
| Itration            | 187      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.52e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -984     |
| Running Env Steps   | 935000   |
| Running Forward KL  | 22.4     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 187      |
----------------------------------
--2023-11-10 13:24:23.623787 CST---
| Itration            | 188       |
| Real Det Return     | 2.69e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 882       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 940000    |
| Running Forward KL  | 23.1      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 188       |
-----------------------------------
--2023-11-10 13:26:35.184763 CST--
| Itration            | 189      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -968     |
| Running Env Steps   | 945000   |
| Running Forward KL  | 21.8     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 189      |
----------------------------------
--2023-11-10 13:28:31.206350 CST---
| Itration            | 190       |
| Real Det Return     | 1.3e+03   |
| Real Det violation  | 1         |
| Real Sto Return     | 575       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 950000    |
| Running Forward KL  | 23        |
| Running Reverse KL  | 24.4      |
| Running Update Time | 190       |
-----------------------------------
--2023-11-10 13:30:32.993794 CST--
| Itration            | 191      |
| Real Det Return     | 1.29e+03 |
| Real Det violation  | 0.95     |
| Real Sto Return     | 1.52e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -1e+03   |
| Running Env Steps   | 955000   |
| Running Forward KL  | 21.5     |
| Running Reverse KL  | 11.1     |
| Running Update Time | 191      |
----------------------------------
--2023-11-10 13:32:24.579506 CST---
| Itration            | 192       |
| Real Det Return     | 573       |
| Real Det violation  | 1         |
| Real Sto Return     | 696       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.15e+03 |
| Running Env Steps   | 960000    |
| Running Forward KL  | 23.3      |
| Running Reverse KL  | 13.4      |
| Running Update Time | 192       |
-----------------------------------
--2023-11-10 13:34:27.047866 CST---
| Itration            | 193       |
| Real Det Return     | 2.09e+03  |
| Real Det violation  | 0.35      |
| Real Sto Return     | 775       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.11e+03 |
| Running Env Steps   | 965000    |
| Running Forward KL  | 22.7      |
| Running Reverse KL  | 31.7      |
| Running Update Time | 193       |
-----------------------------------
--2023-11-10 13:36:19.836274 CST---
| Itration            | 194       |
| Real Det Return     | 643       |
| Real Det violation  | 1         |
| Real Sto Return     | 726       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.02e+03 |
| Running Env Steps   | 970000    |
| Running Forward KL  | 23.4      |
| Running Reverse KL  | 29.2      |
| Running Update Time | 194       |
-----------------------------------
--2023-11-10 13:38:14.898665 CST--
| Itration            | 195      |
| Real Det Return     | 655      |
| Real Det violation  | 1        |
| Real Sto Return     | 877      |
| Real Sto violation  | 1        |
| Reward Loss         | -905     |
| Running Env Steps   | 975000   |
| Running Forward KL  | 23.1     |
| Running Reverse KL  | 50       |
| Running Update Time | 195      |
----------------------------------
--2023-11-10 13:40:01.956428 CST---
| Itration            | 196       |
| Real Det Return     | 245       |
| Real Det violation  | 0         |
| Real Sto Return     | 121       |
| Real Sto violation  | 0         |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 980000    |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 20.1      |
| Running Update Time | 196       |
-----------------------------------
--2023-11-10 13:41:54.624957 CST---
| Itration            | 197       |
| Real Det Return     | 589       |
| Real Det violation  | 0.5       |
| Real Sto Return     | 571       |
| Real Sto violation  | 0.6       |
| Reward Loss         | -1.13e+03 |
| Running Env Steps   | 985000    |
| Running Forward KL  | 24.4      |
| Running Reverse KL  | 16.3      |
| Running Update Time | 197       |
-----------------------------------
--2023-11-10 13:43:44.975866 CST---
| Itration            | 198       |
| Real Det Return     | 358       |
| Real Det violation  | 1         |
| Real Sto Return     | 357       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.15e+03 |
| Running Env Steps   | 990000    |
| Running Forward KL  | 25        |
| Running Reverse KL  | 19.8      |
| Running Update Time | 198       |
-----------------------------------
--2023-11-10 13:45:36.987848 CST---
| Itration            | 199       |
| Real Det Return     | 648       |
| Real Det violation  | 1         |
| Real Sto Return     | 492       |
| Real Sto violation  | 1         |
| Reward Loss         | -1.29e+03 |
| Running Env Steps   | 995000    |
| Running Forward KL  | 24.8      |
| Running Reverse KL  | 18.8      |
| Running Update Time | 199       |
-----------------------------------
--2023-11-10 13:47:43.474673 CST--
| Itration            | 200      |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 798      |
| Real Sto violation  | 1        |
| Reward Loss         | -817     |
| Running Env Steps   | 1000000  |
| Running Forward KL  | 24.4     |
| Running Reverse KL  | 23.9     |
| Running Update Time | 200      |
----------------------------------
--2023-11-10 13:49:49.239822 CST--
| Itration            | 201      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 797      |
| Real Sto violation  | 0.7      |
| Reward Loss         | -941     |
| Running Env Steps   | 1005000  |
| Running Forward KL  | 23.8     |
| Running Reverse KL  | 19.2     |
| Running Update Time | 201      |
----------------------------------
--2023-11-10 13:52:05.475946 CST--
| Itration            | 202      |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -959     |
| Running Env Steps   | 1010000  |
| Running Forward KL  | 22.3     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 202      |
----------------------------------
--2023-11-10 13:54:19.371029 CST--
| Itration            | 203      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.09e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -897     |
| Running Env Steps   | 1015000  |
| Running Forward KL  | 21       |
| Running Reverse KL  | 12.3     |
| Running Update Time | 203      |
----------------------------------
--2023-11-10 13:56:26.594502 CST---
| Itration            | 204       |
| Real Det Return     | 2.76e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 1.1e+03   |
| Real Sto violation  | 0.75      |
| Reward Loss         | -1.08e+03 |
| Running Env Steps   | 1020000   |
| Running Forward KL  | 22.3      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 204       |
-----------------------------------
--2023-11-10 13:58:38.244774 CST--
| Itration            | 205      |
| Real Det Return     | 2.87e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -953     |
| Running Env Steps   | 1025000  |
| Running Forward KL  | 20.4     |
| Running Reverse KL  | 12       |
| Running Update Time | 205      |
----------------------------------
--2023-11-10 14:00:53.951825 CST--
| Itration            | 206      |
| Real Det Return     | 2.85e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -962     |
| Running Env Steps   | 1030000  |
| Running Forward KL  | 21.1     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 206      |
----------------------------------
--2023-11-10 14:03:09.093790 CST--
| Itration            | 207      |
| Real Det Return     | 2.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -883     |
| Running Env Steps   | 1035000  |
| Running Forward KL  | 20.6     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 207      |
----------------------------------
--2023-11-10 14:05:15.112778 CST---
| Itration            | 208       |
| Real Det Return     | 2.57e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 881       |
| Real Sto violation  | 0.8       |
| Reward Loss         | -1.42e+03 |
| Running Env Steps   | 1040000   |
| Running Forward KL  | 22.7      |
| Running Reverse KL  | 12.1      |
| Running Update Time | 208       |
-----------------------------------
--2023-11-10 14:07:25.848730 CST---
| Itration            | 209       |
| Real Det Return     | 2.78e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 1.59e+03  |
| Real Sto violation  | 0.6       |
| Reward Loss         | -1.14e+03 |
| Running Env Steps   | 1045000   |
| Running Forward KL  | 20.8      |
| Running Reverse KL  | 11        |
| Running Update Time | 209       |
-----------------------------------
--2023-11-10 14:09:37.122041 CST---
| Itration            | 210       |
| Real Det Return     | 2.57e+03  |
| Real Det violation  | 0         |
| Real Sto Return     | 1.6e+03   |
| Real Sto violation  | 0.7       |
| Reward Loss         | -1.09e+03 |
| Running Env Steps   | 1050000   |
| Running Forward KL  | 20.1      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 210       |
-----------------------------------
--2023-11-10 14:11:36.042910 CST---
| Itration            | 211       |
| Real Det Return     | 667       |
| Real Det violation  | 0.55      |
| Real Sto Return     | 1.39e+03  |
| Real Sto violation  | 0.35      |
| Reward Loss         | -1.11e+03 |
| Running Env Steps   | 1055000   |
| Running Forward KL  | 21.5      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 211       |
-----------------------------------
--2023-11-10 14:13:28.290383 CST---
| Itration            | 212       |
| Real Det Return     | 459       |
| Real Det violation  | 1         |
| Real Sto Return     | 525       |
| Real Sto violation  | 0.8       |
| Reward Loss         | -1.25e+03 |
| Running Env Steps   | 1060000   |
| Running Forward KL  | 21.6      |
| Running Reverse KL  | 12.4      |
| Running Update Time | 212       |
-----------------------------------
--2023-11-10 14:15:45.800269 CST--
| Itration            | 213      |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -834     |
| Running Env Steps   | 1065000  |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 213      |
----------------------------------
--2023-11-10 14:17:47.666234 CST---
| Itration            | 214       |
| Real Det Return     | 1.38e+03  |
| Real Det violation  | 0.2       |
| Real Sto Return     | 1.02e+03  |
| Real Sto violation  | 0.75      |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 1070000   |
| Running Forward KL  | 20.3      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 214       |
-----------------------------------
--2023-11-10 14:20:01.823454 CST--
| Itration            | 215      |
| Real Det Return     | 2.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | -896     |
| Running Env Steps   | 1075000  |
| Running Forward KL  | 19.3     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 215      |
----------------------------------
--2023-11-10 14:22:17.094637 CST--
| Itration            | 216      |
| Real Det Return     | 2.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.05e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -816     |
| Running Env Steps   | 1080000  |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 216      |
----------------------------------
--2023-11-10 14:24:18.529448 CST--
| Itration            | 217      |
| Real Det Return     | 541      |
| Real Det violation  | 1        |
| Real Sto Return     | 1.86e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | -932     |
| Running Env Steps   | 1085000  |
| Running Forward KL  | 19       |
| Running Reverse KL  | 11.6     |
| Running Update Time | 217      |
----------------------------------
--2023-11-10 14:26:36.023595 CST--
| Itration            | 218      |
| Real Det Return     | 2.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.24e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -888     |
| Running Env Steps   | 1090000  |
| Running Forward KL  | 19.4     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 218      |
----------------------------------
--2023-11-10 14:28:31.534571 CST--
| Itration            | 219      |
| Real Det Return     | 549      |
| Real Det violation  | 1        |
| Real Sto Return     | 1.07e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -976     |
| Running Env Steps   | 1095000  |
| Running Forward KL  | 19.4     |
| Running Reverse KL  | 13       |
| Running Update Time | 219      |
----------------------------------
--2023-11-10 14:30:31.596787 CST---
| Itration            | 220       |
| Real Det Return     | 567       |
| Real Det violation  | 1         |
| Real Sto Return     | 1.43e+03  |
| Real Sto violation  | 0.15      |
| Reward Loss         | -1.03e+03 |
| Running Env Steps   | 1100000   |
| Running Forward KL  | 19.5      |
| Running Reverse KL  | 12.6      |
| Running Update Time | 220       |
-----------------------------------
--2023-11-10 14:32:38.954553 CST--
| Itration            | 221      |
| Real Det Return     | 733      |
| Real Det violation  | 1        |
| Real Sto Return     | 2.24e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -842     |
| Running Env Steps   | 1105000  |
| Running Forward KL  | 18.5     |
| Running Reverse KL  | 13.5     |
| Running Update Time | 221      |
----------------------------------
--2023-11-10 14:34:45.059795 CST--
| Itration            | 222      |
| Real Det Return     | 573      |
| Real Det violation  | 1        |
| Real Sto Return     | 2.12e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -813     |
| Running Env Steps   | 1110000  |
| Running Forward KL  | 17.9     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 222      |
----------------------------------
--2023-11-10 14:37:02.793244 CST--
| Itration            | 223      |
| Real Det Return     | 2.42e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.13e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -825     |
| Running Env Steps   | 1115000  |
| Running Forward KL  | 18.1     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 223      |
----------------------------------
--2023-11-10 14:39:20.324719 CST--
| Itration            | 224      |
| Real Det Return     | 2.2e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -815     |
| Running Env Steps   | 1120000  |
| Running Forward KL  | 17.9     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 224      |
----------------------------------
--2023-11-10 14:41:23.996470 CST--
| Itration            | 225      |
| Real Det Return     | 514      |
| Real Det violation  | 1        |
| Real Sto Return     | 1.95e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -954     |
| Running Env Steps   | 1125000  |
| Running Forward KL  | 18       |
| Running Reverse KL  | 12.1     |
| Running Update Time | 225      |
----------------------------------
--2023-11-10 14:43:43.329554 CST--
| Itration            | 226      |
| Real Det Return     | 2.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -788     |
| Running Env Steps   | 1130000  |
| Running Forward KL  | 17.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 226      |
----------------------------------
--2023-11-10 14:46:01.649873 CST--
| Itration            | 227      |
| Real Det Return     | 2.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -777     |
| Running Env Steps   | 1135000  |
| Running Forward KL  | 17.8     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 227      |
----------------------------------
--2023-11-10 14:48:12.581813 CST--
| Itration            | 228      |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 0.55     |
| Real Sto Return     | 2.18e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -867     |
| Running Env Steps   | 1140000  |
| Running Forward KL  | 18.1     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 228      |
----------------------------------
--2023-11-10 14:50:19.951038 CST--
| Itration            | 229      |
| Real Det Return     | 568      |
| Real Det violation  | 1        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -737     |
| Running Env Steps   | 1145000  |
| Running Forward KL  | 16.7     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 229      |
----------------------------------
--2023-11-10 14:52:40.153003 CST--
| Itration            | 230      |
| Real Det Return     | 2.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -762     |
| Running Env Steps   | 1150000  |
| Running Forward KL  | 16.5     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 230      |
----------------------------------
--2023-11-10 14:54:58.968039 CST--
| Itration            | 231      |
| Real Det Return     | 2.15e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.2e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -807     |
| Running Env Steps   | 1155000  |
| Running Forward KL  | 16.7     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 231      |
----------------------------------
--2023-11-10 14:57:18.622812 CST--
| Itration            | 232      |
| Real Det Return     | 2.17e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.33e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -825     |
| Running Env Steps   | 1160000  |
| Running Forward KL  | 16.5     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 232      |
----------------------------------
--2023-11-10 14:59:38.431233 CST--
| Itration            | 233      |
| Real Det Return     | 2.04e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.2e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -722     |
| Running Env Steps   | 1165000  |
| Running Forward KL  | 15.9     |
| Running Reverse KL  | 13.2     |
| Running Update Time | 233      |
----------------------------------
--2023-11-10 15:01:58.611210 CST--
| Itration            | 234      |
| Real Det Return     | 1.91e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -733     |
| Running Env Steps   | 1170000  |
| Running Forward KL  | 15.7     |
| Running Reverse KL  | 12       |
| Running Update Time | 234      |
----------------------------------
--2023-11-10 15:04:18.368736 CST--
| Itration            | 235      |
| Real Det Return     | 2.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -838     |
| Running Env Steps   | 1175000  |
| Running Forward KL  | 16.1     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 235      |
----------------------------------
--2023-11-10 15:06:38.405943 CST--
| Itration            | 236      |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.1e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -833     |
| Running Env Steps   | 1180000  |
| Running Forward KL  | 16.1     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 236      |
----------------------------------
--2023-11-10 15:08:58.692902 CST--
| Itration            | 237      |
| Real Det Return     | 2.05e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -772     |
| Running Env Steps   | 1185000  |
| Running Forward KL  | 15.7     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 237      |
----------------------------------
--2023-11-10 15:11:19.784044 CST--
| Itration            | 238      |
| Real Det Return     | 2.01e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -764     |
| Running Env Steps   | 1190000  |
| Running Forward KL  | 15.5     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 238      |
----------------------------------
--2023-11-10 15:13:40.224014 CST--
| Itration            | 239      |
| Real Det Return     | 2.08e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -762     |
| Running Env Steps   | 1195000  |
| Running Forward KL  | 15.6     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 239      |
----------------------------------
--2023-11-10 15:16:00.875814 CST--
| Itration            | 240      |
| Real Det Return     | 2.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -886     |
| Running Env Steps   | 1200000  |
| Running Forward KL  | 15.1     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 240      |
----------------------------------
--2023-11-10 15:18:22.215989 CST--
| Itration            | 241      |
| Real Det Return     | 2.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -738     |
| Running Env Steps   | 1205000  |
| Running Forward KL  | 15       |
| Running Reverse KL  | 11.8     |
| Running Update Time | 241      |
----------------------------------
--2023-11-10 15:20:43.934186 CST--
| Itration            | 242      |
| Real Det Return     | 2.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -773     |
| Running Env Steps   | 1210000  |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 242      |
----------------------------------
--2023-11-10 15:23:05.006170 CST--
| Itration            | 243      |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -781     |
| Running Env Steps   | 1215000  |
| Running Forward KL  | 15.1     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 243      |
----------------------------------
--2023-11-10 15:25:26.977714 CST--
| Itration            | 244      |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -742     |
| Running Env Steps   | 1220000  |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 13.9     |
| Running Update Time | 244      |
----------------------------------
--2023-11-10 15:27:48.530465 CST--
| Itration            | 245      |
| Real Det Return     | 1.96e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.05e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -713     |
| Running Env Steps   | 1225000  |
| Running Forward KL  | 14.5     |
| Running Reverse KL  | 12       |
| Running Update Time | 245      |
----------------------------------
--2023-11-10 15:30:10.133002 CST--
| Itration            | 246      |
| Real Det Return     | 1.98e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -678     |
| Running Env Steps   | 1230000  |
| Running Forward KL  | 13.8     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 246      |
----------------------------------
--2023-11-10 15:32:32.062774 CST--
| Itration            | 247      |
| Real Det Return     | 1.95e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -716     |
| Running Env Steps   | 1235000  |
| Running Forward KL  | 14.4     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 247      |
----------------------------------
--2023-11-10 15:34:54.563606 CST--
| Itration            | 248      |
| Real Det Return     | 2.02e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -721     |
| Running Env Steps   | 1240000  |
| Running Forward KL  | 14.7     |
| Running Reverse KL  | 12       |
| Running Update Time | 248      |
----------------------------------
--2023-11-10 15:37:17.546846 CST--
| Itration            | 249      |
| Real Det Return     | 2.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.13e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -745     |
| Running Env Steps   | 1245000  |
| Running Forward KL  | 15.3     |
| Running Reverse KL  | 13       |
| Running Update Time | 249      |
----------------------------------
--2023-11-10 15:39:40.510441 CST--
| Itration            | 250      |
| Real Det Return     | 2.14e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -744     |
| Running Env Steps   | 1250000  |
| Running Forward KL  | 15.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 250      |
----------------------------------
--2023-11-10 15:42:04.465422 CST--
| Itration            | 251      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -752     |
| Running Env Steps   | 1255000  |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 251      |
----------------------------------
--2023-11-10 15:44:27.492417 CST--
| Itration            | 252      |
| Real Det Return     | 2.02e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.1e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -748     |
| Running Env Steps   | 1260000  |
| Running Forward KL  | 15.3     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 252      |
----------------------------------
--2023-11-10 15:46:50.968010 CST--
| Itration            | 253      |
| Real Det Return     | 2.16e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -758     |
| Running Env Steps   | 1265000  |
| Running Forward KL  | 15.6     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 253      |
----------------------------------
--2023-11-10 15:49:14.424324 CST--
| Itration            | 254      |
| Real Det Return     | 1.98e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -680     |
| Running Env Steps   | 1270000  |
| Running Forward KL  | 13.9     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 254      |
----------------------------------
--2023-11-10 15:51:37.957441 CST--
| Itration            | 255      |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -688     |
| Running Env Steps   | 1275000  |
| Running Forward KL  | 13.2     |
| Running Reverse KL  | 11.1     |
| Running Update Time | 255      |
----------------------------------
--2023-11-10 15:54:01.162708 CST--
| Itration            | 256      |
| Real Det Return     | 2.05e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -709     |
| Running Env Steps   | 1280000  |
| Running Forward KL  | 14       |
| Running Reverse KL  | 11.7     |
| Running Update Time | 256      |
----------------------------------
--2023-11-10 15:56:16.126646 CST--
| Itration            | 257      |
| Real Det Return     | 2.02e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -682     |
| Running Env Steps   | 1285000  |
| Running Forward KL  | 14.1     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 257      |
----------------------------------
--2023-11-10 15:58:32.035824 CST--
| Itration            | 258      |
| Real Det Return     | 2.23e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -804     |
| Running Env Steps   | 1290000  |
| Running Forward KL  | 16.5     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 258      |
----------------------------------
--2023-11-10 16:00:47.941352 CST--
| Itration            | 259      |
| Real Det Return     | 1.96e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.98e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -668     |
| Running Env Steps   | 1295000  |
| Running Forward KL  | 13.7     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 259      |
----------------------------------
--2023-11-10 16:03:03.984955 CST--
| Itration            | 260      |
| Real Det Return     | 1.92e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -653     |
| Running Env Steps   | 1300000  |
| Running Forward KL  | 14       |
| Running Reverse KL  | 12.1     |
| Running Update Time | 260      |
----------------------------------
--2023-11-10 16:05:20.597240 CST--
| Itration            | 261      |
| Real Det Return     | 1.99e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -674     |
| Running Env Steps   | 1305000  |
| Running Forward KL  | 14.4     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 261      |
----------------------------------
--2023-11-10 16:07:37.290341 CST--
| Itration            | 262      |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -576     |
| Running Env Steps   | 1310000  |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 262      |
----------------------------------
--2023-11-10 16:09:54.105365 CST--
| Itration            | 263      |
| Real Det Return     | 2.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.89e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -533     |
| Running Env Steps   | 1315000  |
| Running Forward KL  | 13.6     |
| Running Reverse KL  | 13       |
| Running Update Time | 263      |
----------------------------------
--2023-11-10 16:12:10.995884 CST--
| Itration            | 264      |
| Real Det Return     | 1.86e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -565     |
| Running Env Steps   | 1320000  |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 12       |
| Running Update Time | 264      |
----------------------------------
--2023-11-10 16:14:28.700232 CST--
| Itration            | 265      |
| Real Det Return     | 2.29e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -596     |
| Running Env Steps   | 1325000  |
| Running Forward KL  | 14.6     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 265      |
----------------------------------
--2023-11-10 16:16:45.887592 CST--
| Itration            | 266      |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.09e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -589     |
| Running Env Steps   | 1330000  |
| Running Forward KL  | 13.3     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 266      |
----------------------------------
--2023-11-10 16:19:03.940678 CST--
| Itration            | 267      |
| Real Det Return     | 2.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -552     |
| Running Env Steps   | 1335000  |
| Running Forward KL  | 13.3     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 267      |
----------------------------------
--2023-11-10 16:21:21.267522 CST--
| Itration            | 268      |
| Real Det Return     | 2.15e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.13e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -597     |
| Running Env Steps   | 1340000  |
| Running Forward KL  | 13.2     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 268      |
----------------------------------
--2023-11-10 16:23:38.729980 CST--
| Itration            | 269      |
| Real Det Return     | 2.07e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -538     |
| Running Env Steps   | 1345000  |
| Running Forward KL  | 13.6     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 269      |
----------------------------------
--2023-11-10 16:25:55.994123 CST--
| Itration            | 270      |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -576     |
| Running Env Steps   | 1350000  |
| Running Forward KL  | 13       |
| Running Reverse KL  | 11.6     |
| Running Update Time | 270      |
----------------------------------
--2023-11-10 16:28:13.276405 CST--
| Itration            | 271      |
| Real Det Return     | 2.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -587     |
| Running Env Steps   | 1355000  |
| Running Forward KL  | 12.7     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 271      |
----------------------------------
--2023-11-10 16:30:30.847404 CST--
| Itration            | 272      |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.09e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -599     |
| Running Env Steps   | 1360000  |
| Running Forward KL  | 13.5     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 272      |
----------------------------------
--2023-11-10 16:32:48.310261 CST--
| Itration            | 273      |
| Real Det Return     | 1.9e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.89e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -553     |
| Running Env Steps   | 1365000  |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 12       |
| Running Update Time | 273      |
----------------------------------
--2023-11-10 16:35:05.967235 CST--
| Itration            | 274      |
| Real Det Return     | 2.05e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.03e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -558     |
| Running Env Steps   | 1370000  |
| Running Forward KL  | 12.7     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 274      |
----------------------------------
--2023-11-10 16:37:23.155300 CST--
| Itration            | 275      |
| Real Det Return     | 1.98e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -548     |
| Running Env Steps   | 1375000  |
| Running Forward KL  | 12.1     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 275      |
----------------------------------
--2023-11-10 16:39:41.035742 CST--
| Itration            | 276      |
| Real Det Return     | 1.95e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.99e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -555     |
| Running Env Steps   | 1380000  |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 276      |
----------------------------------
--2023-11-10 16:41:58.597746 CST--
| Itration            | 277      |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.03e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -538     |
| Running Env Steps   | 1385000  |
| Running Forward KL  | 12.5     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 277      |
----------------------------------
--2023-11-10 16:44:16.823819 CST--
| Itration            | 278      |
| Real Det Return     | 1.88e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -553     |
| Running Env Steps   | 1390000  |
| Running Forward KL  | 12       |
| Running Reverse KL  | 11.4     |
| Running Update Time | 278      |
----------------------------------
--2023-11-10 16:46:34.074564 CST--
| Itration            | 279      |
| Real Det Return     | 2.14e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -551     |
| Running Env Steps   | 1395000  |
| Running Forward KL  | 13.9     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 279      |
----------------------------------
--2023-11-10 16:48:51.396058 CST--
| Itration            | 280      |
| Real Det Return     | 1.95e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.96e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -566     |
| Running Env Steps   | 1400000  |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 280      |
----------------------------------
--2023-11-10 16:51:09.328353 CST--
| Itration            | 281      |
| Real Det Return     | 2e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 2.06e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -598     |
| Running Env Steps   | 1405000  |
| Running Forward KL  | 13       |
| Running Reverse KL  | 12.1     |
| Running Update Time | 281      |
----------------------------------
--2023-11-10 16:53:27.141381 CST--
| Itration            | 282      |
| Real Det Return     | 2e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -567     |
| Running Env Steps   | 1410000  |
| Running Forward KL  | 13.3     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 282      |
----------------------------------
--2023-11-10 16:55:45.335547 CST--
| Itration            | 283      |
| Real Det Return     | 2e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -577     |
| Running Env Steps   | 1415000  |
| Running Forward KL  | 13.9     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 283      |
----------------------------------
--2023-11-10 16:58:03.376611 CST--
| Itration            | 284      |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -576     |
| Running Env Steps   | 1420000  |
| Running Forward KL  | 12.7     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 284      |
----------------------------------
--2023-11-10 17:00:21.295816 CST--
| Itration            | 285      |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.98e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -559     |
| Running Env Steps   | 1425000  |
| Running Forward KL  | 12.5     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 285      |
----------------------------------
--2023-11-10 17:02:38.948412 CST--
| Itration            | 286      |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -536     |
| Running Env Steps   | 1430000  |
| Running Forward KL  | 11.6     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 286      |
----------------------------------
--2023-11-10 17:04:57.170931 CST--
| Itration            | 287      |
| Real Det Return     | 1.89e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.91e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -561     |
| Running Env Steps   | 1435000  |
| Running Forward KL  | 12.3     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 287      |
----------------------------------
--2023-11-10 17:07:14.816894 CST--
| Itration            | 288      |
| Real Det Return     | 1.95e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -568     |
| Running Env Steps   | 1440000  |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 288      |
----------------------------------
--2023-11-10 17:09:33.387614 CST--
| Itration            | 289      |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.97e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -552     |
| Running Env Steps   | 1445000  |
| Running Forward KL  | 12.7     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 289      |
----------------------------------
--2023-11-10 17:11:51.049772 CST--
| Itration            | 290      |
| Real Det Return     | 1.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.75e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -450     |
| Running Env Steps   | 1450000  |
| Running Forward KL  | 10.8     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 290      |
----------------------------------
--2023-11-10 17:14:08.794061 CST--
| Itration            | 291      |
| Real Det Return     | 1.89e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -548     |
| Running Env Steps   | 1455000  |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 291      |
----------------------------------
--2023-11-10 17:16:26.677126 CST--
| Itration            | 292      |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -530     |
| Running Env Steps   | 1460000  |
| Running Forward KL  | 11.8     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 292      |
----------------------------------
--2023-11-10 17:18:44.618486 CST--
| Itration            | 293      |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.77e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -457     |
| Running Env Steps   | 1465000  |
| Running Forward KL  | 10.4     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 293      |
----------------------------------
--2023-11-10 17:21:05.937609 CST--
| Itration            | 294      |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -476     |
| Running Env Steps   | 1470000  |
| Running Forward KL  | 10.2     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 294      |
----------------------------------
--2023-11-10 17:23:27.105225 CST--
| Itration            | 295      |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -511     |
| Running Env Steps   | 1475000  |
| Running Forward KL  | 11.2     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 295      |
----------------------------------
--2023-11-10 17:25:48.047226 CST--
| Itration            | 296      |
| Real Det Return     | 1.8e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -539     |
| Running Env Steps   | 1480000  |
| Running Forward KL  | 11       |
| Running Reverse KL  | 11.2     |
| Running Update Time | 296      |
----------------------------------
--2023-11-10 17:28:09.048897 CST--
| Itration            | 297      |
| Real Det Return     | 1.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.71e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -465     |
| Running Env Steps   | 1485000  |
| Running Forward KL  | 11       |
| Running Reverse KL  | 12.4     |
| Running Update Time | 297      |
----------------------------------
--2023-11-10 17:30:26.996868 CST--
| Itration            | 298      |
| Real Det Return     | 1.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.73e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -449     |
| Running Env Steps   | 1490000  |
| Running Forward KL  | 10.4     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 298      |
----------------------------------
--2023-11-10 17:32:45.097168 CST--
| Itration            | 299      |
| Real Det Return     | 1.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.66e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -466     |
| Running Env Steps   | 1495000  |
| Running Forward KL  | 9.54     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 299      |
----------------------------------
--2023-11-10 17:35:03.642808 CST--
| Itration            | 300      |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -497     |
| Running Env Steps   | 1500000  |
| Running Forward KL  | 10.6     |
| Running Reverse KL  | 12.1     |
| Running Update Time | 300      |
----------------------------------
--2023-11-10 17:37:22.003028 CST--
| Itration            | 301      |
| Real Det Return     | 1.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -500     |
| Running Env Steps   | 1505000  |
| Running Forward KL  | 10.4     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 301      |
----------------------------------
--2023-11-10 17:39:40.471590 CST--
| Itration            | 302      |
| Real Det Return     | 1.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -455     |
| Running Env Steps   | 1510000  |
| Running Forward KL  | 9.24     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 302      |
----------------------------------
--2023-11-10 17:41:58.936407 CST--
| Itration            | 303      |
| Real Det Return     | 1.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.65e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -442     |
| Running Env Steps   | 1515000  |
| Running Forward KL  | 8.17     |
| Running Reverse KL  | 11.1     |
| Running Update Time | 303      |
----------------------------------
--2023-11-10 17:44:17.569565 CST--
| Itration            | 304      |
| Real Det Return     | 1.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.73e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -418     |
| Running Env Steps   | 1520000  |
| Running Forward KL  | 8.29     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 304      |
----------------------------------
--2023-11-10 17:46:32.899577 CST--
| Itration            | 305      |
| Real Det Return     | 1.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.7e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -458     |
| Running Env Steps   | 1525000  |
| Running Forward KL  | 7.89     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 305      |
----------------------------------
--2023-11-10 17:48:51.348965 CST--
| Itration            | 306      |
| Real Det Return     | 1.53e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.6e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -400     |
| Running Env Steps   | 1530000  |
| Running Forward KL  | 7.76     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 306      |
----------------------------------
--2023-11-10 17:51:09.888677 CST--
| Itration            | 307      |
| Real Det Return     | 1.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.68e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -423     |
| Running Env Steps   | 1535000  |
| Running Forward KL  | 8.42     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 307      |
----------------------------------
--2023-11-10 17:53:28.657132 CST--
| Itration            | 308      |
| Real Det Return     | 1.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -483     |
| Running Env Steps   | 1540000  |
| Running Forward KL  | 9.88     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 308      |
----------------------------------
--2023-11-10 17:55:47.074119 CST--
| Itration            | 309      |
| Real Det Return     | 1.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.7e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -412     |
| Running Env Steps   | 1545000  |
| Running Forward KL  | 8.57     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 309      |
----------------------------------
--2023-11-10 17:58:05.487108 CST--
| Itration            | 310      |
| Real Det Return     | 1.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.64e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -405     |
| Running Env Steps   | 1550000  |
| Running Forward KL  | 7.38     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 310      |
----------------------------------
--2023-11-10 18:00:23.793619 CST--
| Itration            | 311      |
| Real Det Return     | 1.53e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.65e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -424     |
| Running Env Steps   | 1555000  |
| Running Forward KL  | 7.98     |
| Running Reverse KL  | 11       |
| Running Update Time | 311      |
----------------------------------
--2023-11-10 18:02:41.715497 CST--
| Itration            | 312      |
| Real Det Return     | 1.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.46e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -354     |
| Running Env Steps   | 1560000  |
| Running Forward KL  | 6.89     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 312      |
----------------------------------
--2023-11-10 18:04:59.673971 CST--
| Itration            | 313      |
| Real Det Return     | 1.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.39e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -305     |
| Running Env Steps   | 1565000  |
| Running Forward KL  | 4.86     |
| Running Reverse KL  | 9.44     |
| Running Update Time | 313      |
----------------------------------
--2023-11-10 18:07:17.561758 CST--
| Itration            | 314      |
| Real Det Return     | 1.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.44e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -292     |
| Running Env Steps   | 1570000  |
| Running Forward KL  | 5.37     |
| Running Reverse KL  | 9.9      |
| Running Update Time | 314      |
----------------------------------
--2023-11-10 18:09:35.508661 CST--
| Itration            | 315      |
| Real Det Return     | 1.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.69e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -437     |
| Running Env Steps   | 1575000  |
| Running Forward KL  | 6.83     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 315      |
----------------------------------
--2023-11-10 18:11:53.392396 CST--
| Itration            | 316      |
| Real Det Return     | 1.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.36e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -264     |
| Running Env Steps   | 1580000  |
| Running Forward KL  | 4.21     |
| Running Reverse KL  | 9.87     |
| Running Update Time | 316      |
----------------------------------
--2023-11-10 18:14:11.237714 CST--
| Itration            | 317      |
| Real Det Return     | 1.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.53e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -383     |
| Running Env Steps   | 1585000  |
| Running Forward KL  | 5.08     |
| Running Reverse KL  | 9.35     |
| Running Update Time | 317      |
----------------------------------
--2023-11-10 18:16:29.222424 CST--
| Itration            | 318      |
| Real Det Return     | 1.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.5e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -295     |
| Running Env Steps   | 1590000  |
| Running Forward KL  | 4.22     |
| Running Reverse KL  | 9.2      |
| Running Update Time | 318      |
----------------------------------
--2023-11-10 18:18:47.197734 CST--
| Itration            | 319      |
| Real Det Return     | 1.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.53e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -338     |
| Running Env Steps   | 1595000  |
| Running Forward KL  | 5.23     |
| Running Reverse KL  | 9.5      |
| Running Update Time | 319      |
----------------------------------
--2023-11-10 18:21:03.059901 CST--
| Itration            | 320      |
| Real Det Return     | 1.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.15e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -362     |
| Running Env Steps   | 1600000  |
| Running Forward KL  | 3.36     |
| Running Reverse KL  | 8        |
| Running Update Time | 320      |
----------------------------------
--2023-11-10 18:23:21.169900 CST--
| Itration            | 321      |
| Real Det Return     | 1.38e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.45e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -284     |
| Running Env Steps   | 1605000  |
| Running Forward KL  | 4.35     |
| Running Reverse KL  | 9.52     |
| Running Update Time | 321      |
----------------------------------
--2023-11-10 18:25:38.551644 CST--
| Itration            | 322      |
| Real Det Return     | 1.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.39e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -341     |
| Running Env Steps   | 1610000  |
| Running Forward KL  | 3.78     |
| Running Reverse KL  | 8.54     |
| Running Update Time | 322      |
----------------------------------
--2023-11-10 18:27:55.961524 CST--
| Itration            | 323      |
| Real Det Return     | 1.3e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.28e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -232     |
| Running Env Steps   | 1615000  |
| Running Forward KL  | 3.51     |
| Running Reverse KL  | 9.12     |
| Running Update Time | 323      |
----------------------------------
--2023-11-10 18:30:13.675234 CST--
| Itration            | 324      |
| Real Det Return     | 1.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.39e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -252     |
| Running Env Steps   | 1620000  |
| Running Forward KL  | 3.25     |
| Running Reverse KL  | 9.03     |
| Running Update Time | 324      |
----------------------------------
--2023-11-10 18:32:31.283753 CST--
| Itration            | 325      |
| Real Det Return     | 1.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.36e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -266     |
| Running Env Steps   | 1625000  |
| Running Forward KL  | 2.78     |
| Running Reverse KL  | 8.54     |
| Running Update Time | 325      |
----------------------------------
--2023-11-10 18:34:48.946361 CST--
| Itration            | 326      |
| Real Det Return     | 1.41e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.4e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -247     |
| Running Env Steps   | 1630000  |
| Running Forward KL  | 4.39     |
| Running Reverse KL  | 9.38     |
| Running Update Time | 326      |
----------------------------------
--2023-11-10 18:37:06.707348 CST--
| Itration            | 327      |
| Real Det Return     | 1.38e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.38e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -280     |
| Running Env Steps   | 1635000  |
| Running Forward KL  | 2.87     |
| Running Reverse KL  | 8.67     |
| Running Update Time | 327      |
----------------------------------
--2023-11-10 18:39:24.459333 CST--
| Itration            | 328      |
| Real Det Return     | 1.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.44e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -313     |
| Running Env Steps   | 1640000  |
| Running Forward KL  | 3.83     |
| Running Reverse KL  | 9.39     |
| Running Update Time | 328      |
----------------------------------
--2023-11-10 18:41:42.340303 CST--
| Itration            | 329      |
| Real Det Return     | 1.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.31e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -182     |
| Running Env Steps   | 1645000  |
| Running Forward KL  | 2.26     |
| Running Reverse KL  | 8.04     |
| Running Update Time | 329      |
----------------------------------
--2023-11-10 18:44:00.314716 CST--
| Itration            | 330      |
| Real Det Return     | 1.24e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.24e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -179     |
| Running Env Steps   | 1650000  |
| Running Forward KL  | 2.82     |
| Running Reverse KL  | 8.26     |
| Running Update Time | 330      |
----------------------------------
--2023-11-10 18:46:18.212642 CST--
| Itration            | 331      |
| Real Det Return     | 1.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.27e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -216     |
| Running Env Steps   | 1655000  |
| Running Forward KL  | 3.55     |
| Running Reverse KL  | 8.71     |
| Running Update Time | 331      |
----------------------------------
--2023-11-10 18:48:36.315022 CST--
| Itration            | 332      |
| Real Det Return     | 1.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.29e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -165     |
| Running Env Steps   | 1660000  |
| Running Forward KL  | 2.86     |
| Running Reverse KL  | 9.14     |
| Running Update Time | 332      |
----------------------------------
--2023-11-10 18:50:54.487682 CST--
| Itration            | 333      |
| Real Det Return     | 1.41e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.36e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -235     |
| Running Env Steps   | 1665000  |
| Running Forward KL  | 2.69     |
| Running Reverse KL  | 8.53     |
| Running Update Time | 333      |
----------------------------------
--2023-11-10 18:53:12.853197 CST--
| Itration            | 334      |
| Real Det Return     | 1.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.41e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -248     |
| Running Env Steps   | 1670000  |
| Running Forward KL  | 3.02     |
| Running Reverse KL  | 8.62     |
| Running Update Time | 334      |
----------------------------------
--2023-11-10 18:55:31.158176 CST--
| Itration            | 335      |
| Real Det Return     | 1.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -206     |
| Running Env Steps   | 1675000  |
| Running Forward KL  | 2.61     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 335      |
----------------------------------
--2023-11-10 18:57:49.578176 CST--
| Itration            | 336      |
| Real Det Return     | 1.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -299     |
| Running Env Steps   | 1680000  |
| Running Forward KL  | 3.9      |
| Running Reverse KL  | 9.47     |
| Running Update Time | 336      |
----------------------------------
--2023-11-10 19:00:07.937369 CST--
| Itration            | 337      |
| Real Det Return     | 1.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -243     |
| Running Env Steps   | 1685000  |
| Running Forward KL  | 3.39     |
| Running Reverse KL  | 8.49     |
| Running Update Time | 337      |
----------------------------------
--2023-11-10 19:02:26.256997 CST--
| Itration            | 338      |
| Real Det Return     | 1.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.33e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -274     |
| Running Env Steps   | 1690000  |
| Running Forward KL  | 2.51     |
| Running Reverse KL  | 7.86     |
| Running Update Time | 338      |
----------------------------------
--2023-11-10 19:04:44.537287 CST--
| Itration            | 339      |
| Real Det Return     | 1.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.34e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -202     |
| Running Env Steps   | 1695000  |
| Running Forward KL  | 3.14     |
| Running Reverse KL  | 9.88     |
| Running Update Time | 339      |
----------------------------------
--2023-11-10 19:07:02.886600 CST--
| Itration            | 340      |
| Real Det Return     | 1.41e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.4e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -285     |
| Running Env Steps   | 1700000  |
| Running Forward KL  | 2.88     |
| Running Reverse KL  | 8.52     |
| Running Update Time | 340      |
----------------------------------
--2023-11-10 19:09:20.011238 CST--
| Itration            | 341      |
| Real Det Return     | 1.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.3e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -179     |
| Running Env Steps   | 1705000  |
| Running Forward KL  | 2.32     |
| Running Reverse KL  | 8.44     |
| Running Update Time | 341      |
----------------------------------
--2023-11-10 19:11:37.249062 CST--
| Itration            | 342      |
| Real Det Return     | 1.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.21e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -170     |
| Running Env Steps   | 1710000  |
| Running Forward KL  | 2.94     |
| Running Reverse KL  | 8.82     |
| Running Update Time | 342      |
----------------------------------
--2023-11-10 19:13:54.640133 CST--
| Itration            | 343      |
| Real Det Return     | 1.29e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.31e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -195     |
| Running Env Steps   | 1715000  |
| Running Forward KL  | 2.63     |
| Running Reverse KL  | 8.45     |
| Running Update Time | 343      |
----------------------------------
--2023-11-10 19:16:11.846069 CST--
| Itration            | 344      |
| Real Det Return     | 1.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.3e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -213     |
| Running Env Steps   | 1720000  |
| Running Forward KL  | 2.26     |
| Running Reverse KL  | 8.29     |
| Running Update Time | 344      |
----------------------------------
--2023-11-10 19:18:29.035335 CST--
| Itration            | 345      |
| Real Det Return     | 1.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.27e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -198     |
| Running Env Steps   | 1725000  |
| Running Forward KL  | 3.03     |
| Running Reverse KL  | 8.46     |
| Running Update Time | 345      |
----------------------------------
--2023-11-10 19:20:45.952380 CST--
| Itration            | 346      |
| Real Det Return     | 1.24e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.26e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -160     |
| Running Env Steps   | 1730000  |
| Running Forward KL  | 2.81     |
| Running Reverse KL  | 9.23     |
| Running Update Time | 346      |
----------------------------------
--2023-11-10 19:23:03.114414 CST--
| Itration            | 347      |
| Real Det Return     | 1.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.26e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -205     |
| Running Env Steps   | 1735000  |
| Running Forward KL  | 2.79     |
| Running Reverse KL  | 8.59     |
| Running Update Time | 347      |
----------------------------------
--2023-11-10 19:25:20.531346 CST--
| Itration            | 348      |
| Real Det Return     | 1.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.22e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -134     |
| Running Env Steps   | 1740000  |
| Running Forward KL  | 2.02     |
| Running Reverse KL  | 8.25     |
| Running Update Time | 348      |
----------------------------------
--2023-11-10 19:27:38.157036 CST--
| Itration            | 349      |
| Real Det Return     | 1.31e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -207     |
| Running Env Steps   | 1745000  |
| Running Forward KL  | 2.85     |
| Running Reverse KL  | 8.86     |
| Running Update Time | 349      |
----------------------------------
--2023-11-10 19:29:55.678709 CST--
| Itration            | 350      |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.22e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -128     |
| Running Env Steps   | 1750000  |
| Running Forward KL  | 2.66     |
| Running Reverse KL  | 8.59     |
| Running Update Time | 350      |
----------------------------------
--2023-11-10 19:32:13.032816 CST--
| Itration            | 351      |
| Real Det Return     | 1.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -244     |
| Running Env Steps   | 1755000  |
| Running Forward KL  | 3.35     |
| Running Reverse KL  | 8.83     |
| Running Update Time | 351      |
----------------------------------
--2023-11-10 19:34:30.840684 CST--
| Itration            | 352      |
| Real Det Return     | 1.3e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.24e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -176     |
| Running Env Steps   | 1760000  |
| Running Forward KL  | 2.77     |
| Running Reverse KL  | 8.31     |
| Running Update Time | 352      |
----------------------------------
--2023-11-10 19:36:48.551769 CST--
| Itration            | 353      |
| Real Det Return     | 1.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.25e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -159     |
| Running Env Steps   | 1765000  |
| Running Forward KL  | 2.2      |
| Running Reverse KL  | 8.4      |
| Running Update Time | 353      |
----------------------------------
--2023-11-10 19:39:05.926843 CST--
| Itration            | 354      |
| Real Det Return     | 1.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.2e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -184     |
| Running Env Steps   | 1770000  |
| Running Forward KL  | 3.44     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 354      |
----------------------------------
--2023-11-10 19:41:23.534524 CST--
| Itration            | 355      |
| Real Det Return     | 1.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.21e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -165     |
| Running Env Steps   | 1775000  |
| Running Forward KL  | 3.21     |
| Running Reverse KL  | 8.99     |
| Running Update Time | 355      |
----------------------------------
--2023-11-10 19:43:41.020115 CST--
| Itration            | 356      |
| Real Det Return     | 1.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.34e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -288     |
| Running Env Steps   | 1780000  |
| Running Forward KL  | 3.66     |
| Running Reverse KL  | 8.82     |
| Running Update Time | 356      |
----------------------------------
--2023-11-10 19:45:58.569694 CST--
| Itration            | 357      |
| Real Det Return     | 1.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.18e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -126     |
| Running Env Steps   | 1785000  |
| Running Forward KL  | 2.51     |
| Running Reverse KL  | 8.15     |
| Running Update Time | 357      |
----------------------------------
--2023-11-10 19:48:16.038501 CST--
| Itration            | 358      |
| Real Det Return     | 1.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.18e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -143     |
| Running Env Steps   | 1790000  |
| Running Forward KL  | 2.54     |
| Running Reverse KL  | 7.92     |
| Running Update Time | 358      |
----------------------------------
--2023-11-10 19:50:33.808859 CST--
| Itration            | 359      |
| Real Det Return     | 1.18e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.16e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -166     |
| Running Env Steps   | 1795000  |
| Running Forward KL  | 3.44     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 359      |
----------------------------------
--2023-11-10 19:52:51.898307 CST--
| Itration            | 360      |
| Real Det Return     | 1.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.23e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -168     |
| Running Env Steps   | 1800000  |
| Running Forward KL  | 2.38     |
| Running Reverse KL  | 8.05     |
| Running Update Time | 360      |
----------------------------------
--2023-11-10 19:55:09.494234 CST--
| Itration            | 361      |
| Real Det Return     | 1.21e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -124     |
| Running Env Steps   | 1805000  |
| Running Forward KL  | 3.56     |
| Running Reverse KL  | 9.28     |
| Running Update Time | 361      |
----------------------------------
--2023-11-10 19:57:26.855280 CST--
| Itration            | 362      |
| Real Det Return     | 1.15e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.11e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -95.7    |
| Running Env Steps   | 1810000  |
| Running Forward KL  | 2.48     |
| Running Reverse KL  | 7.85     |
| Running Update Time | 362      |
----------------------------------
--2023-11-10 19:59:44.658594 CST--
| Itration            | 363      |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.12e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -92.3    |
| Running Env Steps   | 1815000  |
| Running Forward KL  | 3.44     |
| Running Reverse KL  | 8.24     |
| Running Update Time | 363      |
----------------------------------
--2023-11-10 20:02:02.381036 CST--
| Itration            | 364      |
| Real Det Return     | 1.07e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.02e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -57.4    |
| Running Env Steps   | 1820000  |
| Running Forward KL  | 4.63     |
| Running Reverse KL  | 8.41     |
| Running Update Time | 364      |
----------------------------------
--2023-11-10 20:04:20.298733 CST--
| Itration            | 365      |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -98.8    |
| Running Env Steps   | 1825000  |
| Running Forward KL  | 3.85     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 365      |
----------------------------------
--2023-11-10 20:06:38.579241 CST--
| Itration            | 366      |
| Real Det Return     | 1.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.07e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -118     |
| Running Env Steps   | 1830000  |
| Running Forward KL  | 3.85     |
| Running Reverse KL  | 8.07     |
| Running Update Time | 366      |
----------------------------------
--2023-11-10 20:08:54.356334 CST--
| Itration            | 367      |
| Real Det Return     | 1.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.11e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -135     |
| Running Env Steps   | 1835000  |
| Running Forward KL  | 3.58     |
| Running Reverse KL  | 9.05     |
| Running Update Time | 367      |
----------------------------------
--2023-11-10 20:11:21.329778 CST--
| Itration            | 368      |
| Real Det Return     | 1.14e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -133     |
| Running Env Steps   | 1840000  |
| Running Forward KL  | 3.89     |
| Running Reverse KL  | 8.87     |
| Running Update Time | 368      |
----------------------------------
--2023-11-10 20:13:47.716694 CST--
| Itration            | 369      |
| Real Det Return     | 1.17e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.2e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -126     |
| Running Env Steps   | 1845000  |
| Running Forward KL  | 2.42     |
| Running Reverse KL  | 8.55     |
| Running Update Time | 369      |
----------------------------------
--2023-11-10 20:16:14.123558 CST--
| Itration            | 370      |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.14e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -155     |
| Running Env Steps   | 1850000  |
| Running Forward KL  | 3.87     |
| Running Reverse KL  | 8.23     |
| Running Update Time | 370      |
----------------------------------
--2023-11-10 20:18:40.366957 CST--
| Itration            | 371      |
| Real Det Return     | 1.09e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.06e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -93      |
| Running Env Steps   | 1855000  |
| Running Forward KL  | 4.08     |
| Running Reverse KL  | 8.32     |
| Running Update Time | 371      |
----------------------------------
--2023-11-10 20:21:07.090472 CST--
| Itration            | 372      |
| Real Det Return     | 1.17e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.19e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -146     |
| Running Env Steps   | 1860000  |
| Running Forward KL  | 3.01     |
| Running Reverse KL  | 7.99     |
| Running Update Time | 372      |
----------------------------------
--2023-11-10 20:23:33.747438 CST--
| Itration            | 373      |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.14e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -144     |
| Running Env Steps   | 1865000  |
| Running Forward KL  | 3.67     |
| Running Reverse KL  | 8.39     |
| Running Update Time | 373      |
----------------------------------
--2023-11-10 20:26:00.700196 CST--
| Itration            | 374      |
| Real Det Return     | 1.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.13e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -121     |
| Running Env Steps   | 1870000  |
| Running Forward KL  | 3.31     |
| Running Reverse KL  | 8.59     |
| Running Update Time | 374      |
----------------------------------
--2023-11-10 20:28:27.465684 CST--
| Itration            | 375      |
| Real Det Return     | 1.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.09e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -116     |
| Running Env Steps   | 1875000  |
| Running Forward KL  | 3.82     |
| Running Reverse KL  | 8.32     |
| Running Update Time | 375      |
----------------------------------
--2023-11-10 20:30:54.194910 CST--
| Itration            | 376      |
| Real Det Return     | 1.14e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -181     |
| Running Env Steps   | 1880000  |
| Running Forward KL  | 3.67     |
| Running Reverse KL  | 8.61     |
| Running Update Time | 376      |
----------------------------------
--2023-11-10 20:33:20.166963 CST--
| Itration            | 377      |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.1e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | -127     |
| Running Env Steps   | 1885000  |
| Running Forward KL  | 4.53     |
| Running Reverse KL  | 8.73     |
| Running Update Time | 377      |
----------------------------------
--2023-11-10 20:35:46.754242 CST--
| Itration            | 378      |
| Real Det Return     | 1.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.14e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -132     |
| Running Env Steps   | 1890000  |
| Running Forward KL  | 3.69     |
| Running Reverse KL  | 8.27     |
| Running Update Time | 378      |
----------------------------------
--2023-11-10 20:38:13.086368 CST--
| Itration            | 379      |
| Real Det Return     | 1.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.09e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -112     |
| Running Env Steps   | 1895000  |
| Running Forward KL  | 3.63     |
| Running Reverse KL  | 8.66     |
| Running Update Time | 379      |
----------------------------------
--2023-11-10 20:40:39.404493 CST--
| Itration            | 380      |
| Real Det Return     | 1.11e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -106     |
| Running Env Steps   | 1900000  |
| Running Forward KL  | 4.01     |
| Running Reverse KL  | 8.13     |
| Running Update Time | 380      |
----------------------------------
--2023-11-10 20:43:05.242364 CST--
| Itration            | 381      |
| Real Det Return     | 1e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 1.01e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -24.2    |
| Running Env Steps   | 1905000  |
| Running Forward KL  | 4.9      |
| Running Reverse KL  | 8.72     |
| Running Update Time | 381      |
----------------------------------
--2023-11-10 20:45:31.360253 CST--
| Itration            | 382      |
| Real Det Return     | 1e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 953      |
| Real Sto violation  | 0        |
| Reward Loss         | -29.3    |
| Running Env Steps   | 1910000  |
| Running Forward KL  | 5.11     |
| Running Reverse KL  | 9.05     |
| Running Update Time | 382      |
----------------------------------
--2023-11-10 20:47:57.228963 CST--
| Itration            | 383      |
| Real Det Return     | 1.09e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.04e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -114     |
| Running Env Steps   | 1915000  |
| Running Forward KL  | 4.75     |
| Running Reverse KL  | 8.58     |
| Running Update Time | 383      |
----------------------------------
--2023-11-10 20:50:23.177375 CST--
| Itration            | 384      |
| Real Det Return     | 1.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.03e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -45.2    |
| Running Env Steps   | 1920000  |
| Running Forward KL  | 3.85     |
| Running Reverse KL  | 8.77     |
| Running Update Time | 384      |
----------------------------------
--2023-11-10 20:52:49.108423 CST--
| Itration            | 385      |
| Real Det Return     | 1.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -131     |
| Running Env Steps   | 1925000  |
| Running Forward KL  | 3.27     |
| Running Reverse KL  | 8.31     |
| Running Update Time | 385      |
----------------------------------
--2023-11-10 20:55:15.016553 CST--
| Itration            | 386      |
| Real Det Return     | 1.12e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -151     |
| Running Env Steps   | 1930000  |
| Running Forward KL  | 3.39     |
| Running Reverse KL  | 8.42     |
| Running Update Time | 386      |
----------------------------------
--2023-11-10 20:57:41.216922 CST--
| Itration            | 387      |
| Real Det Return     | 1.09e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.08e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -66.2    |
| Running Env Steps   | 1935000  |
| Running Forward KL  | 3.17     |
| Running Reverse KL  | 8.3      |
| Running Update Time | 387      |
----------------------------------
--2023-11-10 21:00:07.067296 CST--
| Itration            | 388      |
| Real Det Return     | 1.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 992      |
| Real Sto violation  | 0        |
| Reward Loss         | -32.9    |
| Running Env Steps   | 1940000  |
| Running Forward KL  | 4.46     |
| Running Reverse KL  | 8.44     |
| Running Update Time | 388      |
----------------------------------
--2023-11-10 21:02:33.102283 CST--
| Itration            | 389      |
| Real Det Return     | 1e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 977      |
| Real Sto violation  | 0        |
| Reward Loss         | -57.3    |
| Running Env Steps   | 1945000  |
| Running Forward KL  | 4.47     |
| Running Reverse KL  | 8.52     |
| Running Update Time | 389      |
----------------------------------
--2023-11-10 21:04:59.345894 CST--
| Itration            | 390      |
| Real Det Return     | 966      |
| Real Det violation  | 0        |
| Real Sto Return     | 973      |
| Real Sto violation  | 0        |
| Reward Loss         | -54      |
| Running Env Steps   | 1950000  |
| Running Forward KL  | 4.92     |
| Running Reverse KL  | 9.05     |
| Running Update Time | 390      |
----------------------------------
--2023-11-10 21:07:25.674297 CST--
| Itration            | 391      |
| Real Det Return     | 1.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.06e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -85.7    |
| Running Env Steps   | 1955000  |
| Running Forward KL  | 4.4      |
| Running Reverse KL  | 8.35     |
| Running Update Time | 391      |
----------------------------------
--2023-11-10 21:09:51.513153 CST--
| Itration            | 392      |
| Real Det Return     | 990      |
| Real Det violation  | 0        |
| Real Sto Return     | 950      |
| Real Sto violation  | 0        |
| Reward Loss         | -80.2    |
| Running Env Steps   | 1960000  |
| Running Forward KL  | 5.11     |
| Running Reverse KL  | 8.32     |
| Running Update Time | 392      |
----------------------------------
--2023-11-10 21:12:17.824155 CST--
| Itration            | 393      |
| Real Det Return     | 1.04e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 995      |
| Real Sto violation  | 0        |
| Reward Loss         | -62.4    |
| Running Env Steps   | 1965000  |
| Running Forward KL  | 4.14     |
| Running Reverse KL  | 8.48     |
| Running Update Time | 393      |
----------------------------------
--2023-11-10 21:14:43.929905 CST--
| Itration            | 394      |
| Real Det Return     | 1.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.04e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -104     |
| Running Env Steps   | 1970000  |
| Running Forward KL  | 4.1      |
| Running Reverse KL  | 8.31     |
| Running Update Time | 394      |
----------------------------------
--2023-11-10 21:17:10.295278 CST--
| Itration            | 395      |
| Real Det Return     | 947      |
| Real Det violation  | 0        |
| Real Sto Return     | 925      |
| Real Sto violation  | 0        |
| Reward Loss         | 7.62     |
| Running Env Steps   | 1975000  |
| Running Forward KL  | 4.8      |
| Running Reverse KL  | 8.86     |
| Running Update Time | 395      |
----------------------------------
--2023-11-10 21:19:36.574097 CST--
| Itration            | 396      |
| Real Det Return     | 936      |
| Real Det violation  | 0        |
| Real Sto Return     | 908      |
| Real Sto violation  | 0        |
| Reward Loss         | -19.4    |
| Running Env Steps   | 1980000  |
| Running Forward KL  | 5.19     |
| Running Reverse KL  | 8.77     |
| Running Update Time | 396      |
----------------------------------
--2023-11-10 21:22:03.330952 CST--
| Itration            | 397      |
| Real Det Return     | 1.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.11e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -164     |
| Running Env Steps   | 1985000  |
| Running Forward KL  | 3.81     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 397      |
----------------------------------
--2023-11-10 21:24:30.144161 CST--
| Itration            | 398      |
| Real Det Return     | 946      |
| Real Det violation  | 0        |
| Real Sto Return     | 925      |
| Real Sto violation  | 0        |
| Reward Loss         | -34.3    |
| Running Env Steps   | 1990000  |
| Running Forward KL  | 4.95     |
| Running Reverse KL  | 8.99     |
| Running Update Time | 398      |
----------------------------------
--2023-11-10 21:26:57.028177 CST--
| Itration            | 399      |
| Real Det Return     | 1.01e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 986      |
| Real Sto violation  | 0        |
| Reward Loss         | -42.9    |
| Running Env Steps   | 1995000  |
| Running Forward KL  | 4.69     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 399      |
----------------------------------
--2023-11-10 21:29:24.049885 CST--
| Itration            | 400      |
| Real Det Return     | 1.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.03e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -87.6    |
| Running Env Steps   | 2000000  |
| Running Forward KL  | 4.44     |
| Running Reverse KL  | 8.8      |
| Running Update Time | 400      |
----------------------------------
--2023-11-10 21:31:51.144383 CST--
| Itration            | 401      |
| Real Det Return     | 962      |
| Real Det violation  | 0        |
| Real Sto Return     | 923      |
| Real Sto violation  | 0        |
| Reward Loss         | -65.6    |
| Running Env Steps   | 2005000  |
| Running Forward KL  | 5.25     |
| Running Reverse KL  | 8.63     |
| Running Update Time | 401      |
----------------------------------
--2023-11-10 21:34:18.427729 CST--
| Itration            | 402      |
| Real Det Return     | 926      |
| Real Det violation  | 0        |
| Real Sto Return     | 916      |
| Real Sto violation  | 0        |
| Reward Loss         | -38.2    |
| Running Env Steps   | 2010000  |
| Running Forward KL  | 5.39     |
| Running Reverse KL  | 9.17     |
| Running Update Time | 402      |
----------------------------------
--2023-11-10 21:36:44.981612 CST--
| Itration            | 403      |
| Real Det Return     | 901      |
| Real Det violation  | 0        |
| Real Sto Return     | 901      |
| Real Sto violation  | 0        |
| Reward Loss         | -15      |
| Running Env Steps   | 2015000  |
| Running Forward KL  | 5.21     |
| Running Reverse KL  | 8.9      |
| Running Update Time | 403      |
----------------------------------
--2023-11-10 21:39:11.844378 CST--
| Itration            | 404      |
| Real Det Return     | 762      |
| Real Det violation  | 0        |
| Real Sto Return     | 785      |
| Real Sto violation  | 0        |
| Reward Loss         | 68.6     |
| Running Env Steps   | 2020000  |
| Running Forward KL  | 6.48     |
| Running Reverse KL  | 9.81     |
| Running Update Time | 404      |
----------------------------------
--2023-11-10 21:41:38.959340 CST--
| Itration            | 405      |
| Real Det Return     | 887      |
| Real Det violation  | 0        |
| Real Sto Return     | 875      |
| Real Sto violation  | 0        |
| Reward Loss         | 11       |
| Running Env Steps   | 2025000  |
| Running Forward KL  | 6.12     |
| Running Reverse KL  | 9.25     |
| Running Update Time | 405      |
----------------------------------
--2023-11-10 21:44:05.877094 CST--
| Itration            | 406      |
| Real Det Return     | 817      |
| Real Det violation  | 0        |
| Real Sto Return     | 817      |
| Real Sto violation  | 0        |
| Reward Loss         | 46.9     |
| Running Env Steps   | 2030000  |
| Running Forward KL  | 6.88     |
| Running Reverse KL  | 9.45     |
| Running Update Time | 406      |
----------------------------------
--2023-11-10 21:46:33.037726 CST--
| Itration            | 407      |
| Real Det Return     | 902      |
| Real Det violation  | 0        |
| Real Sto Return     | 877      |
| Real Sto violation  | 0        |
| Reward Loss         | 34.7     |
| Running Env Steps   | 2035000  |
| Running Forward KL  | 6.26     |
| Running Reverse KL  | 9.45     |
| Running Update Time | 407      |
----------------------------------
--2023-11-10 21:49:00.414167 CST--
| Itration            | 408      |
| Real Det Return     | 777      |
| Real Det violation  | 0        |
| Real Sto Return     | 831      |
| Real Sto violation  | 0        |
| Reward Loss         | 12.9     |
| Running Env Steps   | 2040000  |
| Running Forward KL  | 6.33     |
| Running Reverse KL  | 9.4      |
| Running Update Time | 408      |
----------------------------------
--2023-11-10 21:51:27.661771 CST--
| Itration            | 409      |
| Real Det Return     | 822      |
| Real Det violation  | 0        |
| Real Sto Return     | 805      |
| Real Sto violation  | 0        |
| Reward Loss         | 18.3     |
| Running Env Steps   | 2045000  |
| Running Forward KL  | 6.6      |
| Running Reverse KL  | 9.4      |
| Running Update Time | 409      |
----------------------------------
--2023-11-10 21:53:54.592282 CST--
| Itration            | 410      |
| Real Det Return     | 750      |
| Real Det violation  | 0        |
| Real Sto Return     | 747      |
| Real Sto violation  | 0        |
| Reward Loss         | 70.9     |
| Running Env Steps   | 2050000  |
| Running Forward KL  | 6.58     |
| Running Reverse KL  | 9.79     |
| Running Update Time | 410      |
----------------------------------
--2023-11-10 21:56:21.920440 CST--
| Itration            | 411      |
| Real Det Return     | 864      |
| Real Det violation  | 0        |
| Real Sto Return     | 793      |
| Real Sto violation  | 0        |
| Reward Loss         | 38.2     |
| Running Env Steps   | 2055000  |
| Running Forward KL  | 6.68     |
| Running Reverse KL  | 9.66     |
| Running Update Time | 411      |
----------------------------------
--2023-11-10 21:58:49.556355 CST--
| Itration            | 412      |
| Real Det Return     | 812      |
| Real Det violation  | 0        |
| Real Sto Return     | 807      |
| Real Sto violation  | 0        |
| Reward Loss         | 8.94     |
| Running Env Steps   | 2060000  |
| Running Forward KL  | 6.9      |
| Running Reverse KL  | 9.25     |
| Running Update Time | 412      |
----------------------------------
--2023-11-10 22:01:17.725529 CST--
| Itration            | 413      |
| Real Det Return     | 814      |
| Real Det violation  | 0        |
| Real Sto Return     | 772      |
| Real Sto violation  | 0        |
| Reward Loss         | 60.6     |
| Running Env Steps   | 2065000  |
| Running Forward KL  | 5.96     |
| Running Reverse KL  | 9.65     |
| Running Update Time | 413      |
----------------------------------
--2023-11-10 22:03:45.294285 CST--
| Itration            | 414      |
| Real Det Return     | 636      |
| Real Det violation  | 0        |
| Real Sto Return     | 698      |
| Real Sto violation  | 0        |
| Reward Loss         | 67.5     |
| Running Env Steps   | 2070000  |
| Running Forward KL  | 7.42     |
| Running Reverse KL  | 9.69     |
| Running Update Time | 414      |
----------------------------------
--2023-11-10 22:06:13.016907 CST--
| Itration            | 415      |
| Real Det Return     | 874      |
| Real Det violation  | 0        |
| Real Sto Return     | 831      |
| Real Sto violation  | 0        |
| Reward Loss         | 25       |
| Running Env Steps   | 2075000  |
| Running Forward KL  | 6.34     |
| Running Reverse KL  | 9.54     |
| Running Update Time | 415      |
----------------------------------
--2023-11-10 22:08:31.982284 CST--
| Itration            | 416      |
| Real Det Return     | 758      |
| Real Det violation  | 0        |
| Real Sto Return     | 760      |
| Real Sto violation  | 0        |
| Reward Loss         | 20.7     |
| Running Env Steps   | 2080000  |
| Running Forward KL  | 7.44     |
| Running Reverse KL  | 9.59     |
| Running Update Time | 416      |
----------------------------------
--2023-11-10 22:10:51.910620 CST--
| Itration            | 417      |
| Real Det Return     | 853      |
| Real Det violation  | 0        |
| Real Sto Return     | 836      |
| Real Sto violation  | 0        |
| Reward Loss         | -16      |
| Running Env Steps   | 2085000  |
| Running Forward KL  | 7.39     |
| Running Reverse KL  | 9.4      |
| Running Update Time | 417      |
----------------------------------
--2023-11-10 22:13:11.934365 CST--
| Itration            | 418      |
| Real Det Return     | 576      |
| Real Det violation  | 0        |
| Real Sto Return     | 719      |
| Real Sto violation  | 0        |
| Reward Loss         | 57.3     |
| Running Env Steps   | 2090000  |
| Running Forward KL  | 7.56     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 418      |
----------------------------------
--2023-11-10 22:15:32.240654 CST--
| Itration            | 419      |
| Real Det Return     | 809      |
| Real Det violation  | 0        |
| Real Sto Return     | 844      |
| Real Sto violation  | 0        |
| Reward Loss         | -16.4    |
| Running Env Steps   | 2095000  |
| Running Forward KL  | 7.41     |
| Running Reverse KL  | 9.72     |
| Running Update Time | 419      |
----------------------------------
--2023-11-10 22:17:52.811678 CST--
| Itration            | 420      |
| Real Det Return     | 750      |
| Real Det violation  | 0        |
| Real Sto Return     | 729      |
| Real Sto violation  | 0        |
| Reward Loss         | 38.4     |
| Running Env Steps   | 2100000  |
| Running Forward KL  | 6.39     |
| Running Reverse KL  | 9.15     |
| Running Update Time | 420      |
----------------------------------
--2023-11-10 22:20:13.383253 CST--
| Itration            | 421      |
| Real Det Return     | 753      |
| Real Det violation  | 0        |
| Real Sto Return     | 798      |
| Real Sto violation  | 0        |
| Reward Loss         | 11.3     |
| Running Env Steps   | 2105000  |
| Running Forward KL  | 7.48     |
| Running Reverse KL  | 9.96     |
| Running Update Time | 421      |
----------------------------------
--2023-11-10 22:22:33.639576 CST--
| Itration            | 422      |
| Real Det Return     | 710      |
| Real Det violation  | 0        |
| Real Sto Return     | 729      |
| Real Sto violation  | 0.05     |
| Reward Loss         | 65       |
| Running Env Steps   | 2110000  |
| Running Forward KL  | 6.62     |
| Running Reverse KL  | 9.85     |
| Running Update Time | 422      |
----------------------------------
--2023-11-10 22:24:54.353608 CST--
| Itration            | 423      |
| Real Det Return     | 551      |
| Real Det violation  | 0        |
| Real Sto Return     | 634      |
| Real Sto violation  | 0        |
| Reward Loss         | 107      |
| Running Env Steps   | 2115000  |
| Running Forward KL  | 8.4      |
| Running Reverse KL  | 10.6     |
| Running Update Time | 423      |
----------------------------------
--2023-11-10 22:27:14.234267 CST--
| Itration            | 424      |
| Real Det Return     | 559      |
| Real Det violation  | 0        |
| Real Sto Return     | 565      |
| Real Sto violation  | 0.1      |
| Reward Loss         | -116     |
| Running Env Steps   | 2120000  |
| Running Forward KL  | 9.7      |
| Running Reverse KL  | 11.2     |
| Running Update Time | 424      |
----------------------------------
--2023-11-10 22:29:34.913915 CST--
| Itration            | 425      |
| Real Det Return     | 680      |
| Real Det violation  | 0        |
| Real Sto Return     | 746      |
| Real Sto violation  | 0        |
| Reward Loss         | 78.5     |
| Running Env Steps   | 2125000  |
| Running Forward KL  | 7.76     |
| Running Reverse KL  | 9.96     |
| Running Update Time | 425      |
----------------------------------
