Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_08_12_12_52
--2023-11-08 12:14:12.039106 CST--
| Itration            | 0        |
| Real Det Return     | 1.51e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.69e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 69.5     |
| Running Env Steps   | 0        |
| Running Forward KL  | 19.1     |
| Running Reverse KL  | 10       |
| Running Update Time | 0        |
----------------------------------
--2023-11-08 12:15:39.189312 CST--
| Itration            | 1        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.61e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 109      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 18.1     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 1        |
----------------------------------
--2023-11-08 12:17:06.498735 CST--
| Itration            | 2        |
| Real Det Return     | 1.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 87.9     |
| Running Env Steps   | 10000    |
| Running Forward KL  | 17.6     |
| Running Reverse KL  | 10.4     |
| Running Update Time | 2        |
----------------------------------
--2023-11-08 12:18:34.407705 CST--
| Itration            | 3        |
| Real Det Return     | 1.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.62e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | 80.7     |
| Running Env Steps   | 15000    |
| Running Forward KL  | 18.6     |
| Running Reverse KL  | 9.81     |
| Running Update Time | 3        |
----------------------------------
--2023-11-08 12:20:02.085927 CST--
| Itration            | 4        |
| Real Det Return     | 1.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.65e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 92.5     |
| Running Env Steps   | 20000    |
| Running Forward KL  | 17.2     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 4        |
----------------------------------
--2023-11-08 12:21:29.824607 CST--
| Itration            | 5        |
| Real Det Return     | 1.91e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.64e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 50.8     |
| Running Env Steps   | 25000    |
| Running Forward KL  | 18       |
| Running Reverse KL  | 10.2     |
| Running Update Time | 5        |
----------------------------------
--2023-11-08 12:22:57.775940 CST--
| Itration            | 6        |
| Real Det Return     | 1.86e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.62e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 39.9     |
| Running Env Steps   | 30000    |
| Running Forward KL  | 17.7     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 6        |
----------------------------------
--2023-11-08 12:24:25.561815 CST--
| Itration            | 7        |
| Real Det Return     | 1.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.61e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 33.3     |
| Running Env Steps   | 35000    |
| Running Forward KL  | 17.2     |
| Running Reverse KL  | 10       |
| Running Update Time | 7        |
----------------------------------
--2023-11-08 12:25:54.189174 CST--
| Itration            | 8        |
| Real Det Return     | 1.79e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.66e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | 4.97     |
| Running Env Steps   | 40000    |
| Running Forward KL  | 17       |
| Running Reverse KL  | 10.1     |
| Running Update Time | 8        |
----------------------------------
--2023-11-08 12:27:23.311396 CST--
| Itration            | 9        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.67e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -13      |
| Running Env Steps   | 45000    |
| Running Forward KL  | 17       |
| Running Reverse KL  | 9.99     |
| Running Update Time | 9        |
----------------------------------
--2023-11-08 12:28:54.299949 CST--
| Itration            | 10       |
| Real Det Return     | 1.84e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.7e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -14.8    |
| Running Env Steps   | 50000    |
| Running Forward KL  | 17.3     |
| Running Reverse KL  | 9.68     |
| Running Update Time | 10       |
----------------------------------
--2023-11-08 12:30:27.564791 CST--
| Itration            | 11       |
| Real Det Return     | 2e+03    |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -11.6    |
| Running Env Steps   | 55000    |
| Running Forward KL  | 17.8     |
| Running Reverse KL  | 9.54     |
| Running Update Time | 11       |
----------------------------------
--2023-11-08 12:32:02.042404 CST--
| Itration            | 12       |
| Real Det Return     | 1.79e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -40.8    |
| Running Env Steps   | 60000    |
| Running Forward KL  | 16.9     |
| Running Reverse KL  | 9.49     |
| Running Update Time | 12       |
----------------------------------
--2023-11-08 12:33:37.690608 CST--
| Itration            | 13       |
| Real Det Return     | 1.87e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.7e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -46.6    |
| Running Env Steps   | 65000    |
| Running Forward KL  | 17       |
| Running Reverse KL  | 9.39     |
| Running Update Time | 13       |
----------------------------------
--2023-11-08 12:35:16.541850 CST--
| Itration            | 14       |
| Real Det Return     | 2.08e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.73e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -46.6    |
| Running Env Steps   | 70000    |
| Running Forward KL  | 16.9     |
| Running Reverse KL  | 9.46     |
| Running Update Time | 14       |
----------------------------------
--2023-11-08 12:37:00.356086 CST--
| Itration            | 15       |
| Real Det Return     | 1.82e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.74e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -75.1    |
| Running Env Steps   | 75000    |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 9.36     |
| Running Update Time | 15       |
----------------------------------
--2023-11-08 12:38:51.761267 CST--
| Itration            | 16       |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.7e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -30.3    |
| Running Env Steps   | 80000    |
| Running Forward KL  | 17.5     |
| Running Reverse KL  | 9.13     |
| Running Update Time | 16       |
----------------------------------
--2023-11-08 12:40:44.658419 CST--
| Itration            | 17       |
| Real Det Return     | 2.02e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -68.1    |
| Running Env Steps   | 85000    |
| Running Forward KL  | 16.7     |
| Running Reverse KL  | 8.95     |
| Running Update Time | 17       |
----------------------------------
--2023-11-08 12:42:38.993186 CST--
| Itration            | 18       |
| Real Det Return     | 2.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.74e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -73.2    |
| Running Env Steps   | 90000    |
| Running Forward KL  | 17.1     |
| Running Reverse KL  | 8.86     |
| Running Update Time | 18       |
----------------------------------
--2023-11-08 12:44:34.535259 CST--
| Itration            | 19       |
| Real Det Return     | 2.2e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.77e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -103     |
| Running Env Steps   | 95000    |
| Running Forward KL  | 16.4     |
| Running Reverse KL  | 8.9      |
| Running Update Time | 19       |
----------------------------------
--2023-11-08 12:46:31.449121 CST--
| Itration            | 20       |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -80.9    |
| Running Env Steps   | 100000   |
| Running Forward KL  | 16.7     |
| Running Reverse KL  | 8.76     |
| Running Update Time | 20       |
----------------------------------
--2023-11-08 12:48:29.022110 CST--
| Itration            | 21       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.74e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -108     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 8.47     |
| Running Update Time | 21       |
----------------------------------
--2023-11-08 12:50:27.731791 CST--
| Itration            | 22       |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.71e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -103     |
| Running Env Steps   | 110000   |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 8.64     |
| Running Update Time | 22       |
----------------------------------
--2023-11-08 12:52:27.524328 CST--
| Itration            | 23       |
| Real Det Return     | 1.95e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -111     |
| Running Env Steps   | 115000   |
| Running Forward KL  | 16.4     |
| Running Reverse KL  | 8.42     |
| Running Update Time | 23       |
----------------------------------
--2023-11-08 12:54:24.182200 CST--
| Itration            | 24       |
| Real Det Return     | 2.16e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.8e+03  |
| Real Sto violation  | 0.95     |
| Reward Loss         | -128     |
| Running Env Steps   | 120000   |
| Running Forward KL  | 16.1     |
| Running Reverse KL  | 8.58     |
| Running Update Time | 24       |
----------------------------------
--2023-11-08 12:56:21.545387 CST--
| Itration            | 25       |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -121     |
| Running Env Steps   | 125000   |
| Running Forward KL  | 16.6     |
| Running Reverse KL  | 8.43     |
| Running Update Time | 25       |
----------------------------------
--2023-11-08 12:58:19.644437 CST--
| Itration            | 26       |
| Real Det Return     | 1.97e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -130     |
| Running Env Steps   | 130000   |
| Running Forward KL  | 16.7     |
| Running Reverse KL  | 8.39     |
| Running Update Time | 26       |
----------------------------------
--2023-11-08 13:00:18.142874 CST--
| Itration            | 27       |
| Real Det Return     | 1.99e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -114     |
| Running Env Steps   | 135000   |
| Running Forward KL  | 17       |
| Running Reverse KL  | 8.37     |
| Running Update Time | 27       |
----------------------------------
--2023-11-08 13:02:16.691314 CST--
| Itration            | 28       |
| Real Det Return     | 2.01e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.73e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -146     |
| Running Env Steps   | 140000   |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 8.27     |
| Running Update Time | 28       |
----------------------------------
--2023-11-08 13:04:15.768508 CST--
| Itration            | 29       |
| Real Det Return     | 2.01e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -146     |
| Running Env Steps   | 145000   |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 8.23     |
| Running Update Time | 29       |
----------------------------------
--2023-11-08 13:06:15.692793 CST--
| Itration            | 30       |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.73e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -164     |
| Running Env Steps   | 150000   |
| Running Forward KL  | 16       |
| Running Reverse KL  | 8.27     |
| Running Update Time | 30       |
----------------------------------
--2023-11-08 13:08:16.254952 CST--
| Itration            | 31       |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -183     |
| Running Env Steps   | 155000   |
| Running Forward KL  | 15.6     |
| Running Reverse KL  | 8.43     |
| Running Update Time | 31       |
----------------------------------
--2023-11-08 13:10:16.656651 CST--
| Itration            | 32       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -151     |
| Running Env Steps   | 160000   |
| Running Forward KL  | 17.1     |
| Running Reverse KL  | 8        |
| Running Update Time | 32       |
----------------------------------
--2023-11-08 13:12:17.860264 CST--
| Itration            | 33       |
| Real Det Return     | 1.91e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -177     |
| Running Env Steps   | 165000   |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 8.2      |
| Running Update Time | 33       |
----------------------------------
--2023-11-08 13:14:18.995762 CST--
| Itration            | 34       |
| Real Det Return     | 1.81e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.75e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -185     |
| Running Env Steps   | 170000   |
| Running Forward KL  | 15.7     |
| Running Reverse KL  | 8.19     |
| Running Update Time | 34       |
----------------------------------
--2023-11-08 13:16:20.199702 CST--
| Itration            | 35       |
| Real Det Return     | 1.89e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -197     |
| Running Env Steps   | 175000   |
| Running Forward KL  | 16.5     |
| Running Reverse KL  | 8.15     |
| Running Update Time | 35       |
----------------------------------
--2023-11-08 13:18:21.515489 CST--
| Itration            | 36       |
| Real Det Return     | 1.83e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -195     |
| Running Env Steps   | 180000   |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 7.97     |
| Running Update Time | 36       |
----------------------------------
--2023-11-08 13:20:22.910955 CST--
| Itration            | 37       |
| Real Det Return     | 1.91e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -213     |
| Running Env Steps   | 185000   |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 7.98     |
| Running Update Time | 37       |
----------------------------------
--2023-11-08 13:22:24.245149 CST--
| Itration            | 38       |
| Real Det Return     | 1.85e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -214     |
| Running Env Steps   | 190000   |
| Running Forward KL  | 16.1     |
| Running Reverse KL  | 8.12     |
| Running Update Time | 38       |
----------------------------------
--2023-11-08 13:24:25.411873 CST--
| Itration            | 39       |
| Real Det Return     | 1.93e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -192     |
| Running Env Steps   | 195000   |
| Running Forward KL  | 16       |
| Running Reverse KL  | 7.85     |
| Running Update Time | 39       |
----------------------------------
--2023-11-08 13:26:27.074941 CST--
| Itration            | 40       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -194     |
| Running Env Steps   | 200000   |
| Running Forward KL  | 15.4     |
| Running Reverse KL  | 7.92     |
| Running Update Time | 40       |
----------------------------------
--2023-11-08 13:28:28.783116 CST--
| Itration            | 41       |
| Real Det Return     | 2.03e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -222     |
| Running Env Steps   | 205000   |
| Running Forward KL  | 15.1     |
| Running Reverse KL  | 8        |
| Running Update Time | 41       |
----------------------------------
--2023-11-08 13:30:30.540887 CST--
| Itration            | 42       |
| Real Det Return     | 2.04e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.74e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -198     |
| Running Env Steps   | 210000   |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 7.36     |
| Running Update Time | 42       |
----------------------------------
--2023-11-08 13:32:32.341200 CST--
| Itration            | 43       |
| Real Det Return     | 1.88e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.77e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -233     |
| Running Env Steps   | 215000   |
| Running Forward KL  | 15.4     |
| Running Reverse KL  | 7.9      |
| Running Update Time | 43       |
----------------------------------
--2023-11-08 13:34:34.869316 CST--
| Itration            | 44       |
| Real Det Return     | 1.89e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.72e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -240     |
| Running Env Steps   | 220000   |
| Running Forward KL  | 16       |
| Running Reverse KL  | 7.72     |
| Running Update Time | 44       |
----------------------------------
--2023-11-08 13:36:36.477412 CST--
| Itration            | 45       |
| Real Det Return     | 1.87e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.74e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -238     |
| Running Env Steps   | 225000   |
| Running Forward KL  | 15.4     |
| Running Reverse KL  | 7.57     |
| Running Update Time | 45       |
----------------------------------
--2023-11-08 13:38:37.956518 CST--
| Itration            | 46       |
| Real Det Return     | 2.01e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -243     |
| Running Env Steps   | 230000   |
| Running Forward KL  | 15.5     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 46       |
----------------------------------
--2023-11-08 13:40:39.677309 CST--
| Itration            | 47       |
| Real Det Return     | 2.2e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -248     |
| Running Env Steps   | 235000   |
| Running Forward KL  | 15.5     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 47       |
----------------------------------
--2023-11-08 13:42:41.335865 CST--
| Itration            | 48       |
| Real Det Return     | 2.08e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -255     |
| Running Env Steps   | 240000   |
| Running Forward KL  | 14.6     |
| Running Reverse KL  | 7.89     |
| Running Update Time | 48       |
----------------------------------
--2023-11-08 13:44:42.847765 CST--
| Itration            | 49       |
| Real Det Return     | 1.94e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -273     |
| Running Env Steps   | 245000   |
| Running Forward KL  | 14.7     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 49       |
----------------------------------
--2023-11-08 13:46:44.512890 CST--
| Itration            | 50       |
| Real Det Return     | 2.15e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.79e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -276     |
| Running Env Steps   | 250000   |
| Running Forward KL  | 15.1     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 50       |
----------------------------------
--2023-11-08 13:48:44.589440 CST--
| Itration            | 51       |
| Real Det Return     | 2.1e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -283     |
| Running Env Steps   | 255000   |
| Running Forward KL  | 14.7     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 51       |
----------------------------------
--2023-11-08 13:50:46.822491 CST--
| Itration            | 52       |
| Real Det Return     | 2.02e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.76e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -286     |
| Running Env Steps   | 260000   |
| Running Forward KL  | 14.5     |
| Running Reverse KL  | 7.6      |
| Running Update Time | 52       |
----------------------------------
--2023-11-08 13:52:49.402664 CST--
| Itration            | 53       |
| Real Det Return     | 2.04e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -294     |
| Running Env Steps   | 265000   |
| Running Forward KL  | 15       |
| Running Reverse KL  | 7.5      |
| Running Update Time | 53       |
----------------------------------
--2023-11-08 13:54:51.940904 CST--
| Itration            | 54       |
| Real Det Return     | 2.18e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.8e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -303     |
| Running Env Steps   | 270000   |
| Running Forward KL  | 14.9     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 54       |
----------------------------------
--2023-11-08 13:56:55.013892 CST--
| Itration            | 55       |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -295     |
| Running Env Steps   | 275000   |
| Running Forward KL  | 15       |
| Running Reverse KL  | 7.64     |
| Running Update Time | 55       |
----------------------------------
--2023-11-08 13:58:57.907601 CST--
| Itration            | 56       |
| Real Det Return     | 2.3e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.85e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -317     |
| Running Env Steps   | 280000   |
| Running Forward KL  | 14       |
| Running Reverse KL  | 7.62     |
| Running Update Time | 56       |
----------------------------------
--2023-11-08 14:01:00.798175 CST--
| Itration            | 57       |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.84e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -322     |
| Running Env Steps   | 285000   |
| Running Forward KL  | 14.6     |
| Running Reverse KL  | 7.67     |
| Running Update Time | 57       |
----------------------------------
--2023-11-08 14:03:04.478280 CST--
| Itration            | 58       |
| Real Det Return     | 2.21e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -290     |
| Running Env Steps   | 290000   |
| Running Forward KL  | 15.4     |
| Running Reverse KL  | 7.29     |
| Running Update Time | 58       |
----------------------------------
--2023-11-08 14:05:06.377170 CST--
| Itration            | 59       |
| Real Det Return     | 2.33e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -302     |
| Running Env Steps   | 295000   |
| Running Forward KL  | 14.4     |
| Running Reverse KL  | 7.41     |
| Running Update Time | 59       |
----------------------------------
--2023-11-08 14:07:08.606214 CST--
| Itration            | 60       |
| Real Det Return     | 2.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -291     |
| Running Env Steps   | 300000   |
| Running Forward KL  | 14.7     |
| Running Reverse KL  | 7.16     |
| Running Update Time | 60       |
----------------------------------
--2023-11-08 14:09:10.987825 CST--
| Itration            | 61       |
| Real Det Return     | 2.04e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -314     |
| Running Env Steps   | 305000   |
| Running Forward KL  | 14.5     |
| Running Reverse KL  | 7.5      |
| Running Update Time | 61       |
----------------------------------
--2023-11-08 14:11:13.266102 CST--
| Itration            | 62       |
| Real Det Return     | 2.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -333     |
| Running Env Steps   | 310000   |
| Running Forward KL  | 14.3     |
| Running Reverse KL  | 7.45     |
| Running Update Time | 62       |
----------------------------------
--2023-11-08 14:13:16.009443 CST--
| Itration            | 63       |
| Real Det Return     | 2.19e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.85e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -324     |
| Running Env Steps   | 315000   |
| Running Forward KL  | 14       |
| Running Reverse KL  | 7.48     |
| Running Update Time | 63       |
----------------------------------
--2023-11-08 14:15:18.984875 CST--
| Itration            | 64       |
| Real Det Return     | 2.31e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -319     |
| Running Env Steps   | 320000   |
| Running Forward KL  | 14.6     |
| Running Reverse KL  | 7.11     |
| Running Update Time | 64       |
----------------------------------
--2023-11-08 14:17:21.551343 CST--
| Itration            | 65       |
| Real Det Return     | 2.26e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.88e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -366     |
| Running Env Steps   | 325000   |
| Running Forward KL  | 13.8     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 65       |
----------------------------------
--2023-11-08 14:19:23.956407 CST--
| Itration            | 66       |
| Real Det Return     | 2.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.85e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -348     |
| Running Env Steps   | 330000   |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 66       |
----------------------------------
--2023-11-08 14:21:26.418067 CST--
| Itration            | 67       |
| Real Det Return     | 2.34e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.92e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -349     |
| Running Env Steps   | 335000   |
| Running Forward KL  | 13.9     |
| Running Reverse KL  | 7.31     |
| Running Update Time | 67       |
----------------------------------
--2023-11-08 14:23:29.049799 CST--
| Itration            | 68       |
| Real Det Return     | 2.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.89e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -356     |
| Running Env Steps   | 340000   |
| Running Forward KL  | 13.6     |
| Running Reverse KL  | 7.64     |
| Running Update Time | 68       |
----------------------------------
--2023-11-08 14:25:32.006201 CST--
| Itration            | 69       |
| Real Det Return     | 2.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -353     |
| Running Env Steps   | 345000   |
| Running Forward KL  | 14       |
| Running Reverse KL  | 7.43     |
| Running Update Time | 69       |
----------------------------------
--2023-11-08 14:27:34.610569 CST--
| Itration            | 70       |
| Real Det Return     | 2.38e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -374     |
| Running Env Steps   | 350000   |
| Running Forward KL  | 13.3     |
| Running Reverse KL  | 7.2      |
| Running Update Time | 70       |
----------------------------------
--2023-11-08 14:29:37.601043 CST--
| Itration            | 71       |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -382     |
| Running Env Steps   | 355000   |
| Running Forward KL  | 13.3     |
| Running Reverse KL  | 7.42     |
| Running Update Time | 71       |
----------------------------------
--2023-11-08 14:31:40.475073 CST--
| Itration            | 72       |
| Real Det Return     | 2.42e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.9e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -386     |
| Running Env Steps   | 360000   |
| Running Forward KL  | 12.7     |
| Running Reverse KL  | 7.35     |
| Running Update Time | 72       |
----------------------------------
--2023-11-08 14:33:43.508156 CST--
| Itration            | 73       |
| Real Det Return     | 2.31e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -398     |
| Running Env Steps   | 365000   |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 73       |
----------------------------------
--2023-11-08 14:35:46.860586 CST--
| Itration            | 74       |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -383     |
| Running Env Steps   | 370000   |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 7.73     |
| Running Update Time | 74       |
----------------------------------
--2023-11-08 14:37:50.092902 CST--
| Itration            | 75       |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -389     |
| Running Env Steps   | 375000   |
| Running Forward KL  | 13       |
| Running Reverse KL  | 7.5      |
| Running Update Time | 75       |
----------------------------------
--2023-11-08 14:39:53.407886 CST--
| Itration            | 76       |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.93e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -382     |
| Running Env Steps   | 380000   |
| Running Forward KL  | 12.5     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 76       |
----------------------------------
--2023-11-08 14:41:56.769973 CST--
| Itration            | 77       |
| Real Det Return     | 2.49e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.01e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -367     |
| Running Env Steps   | 385000   |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 77       |
----------------------------------
--2023-11-08 14:43:59.550536 CST--
| Itration            | 78       |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -405     |
| Running Env Steps   | 390000   |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 7.42     |
| Running Update Time | 78       |
----------------------------------
--2023-11-08 14:46:02.585643 CST--
| Itration            | 79       |
| Real Det Return     | 2.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.09e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -391     |
| Running Env Steps   | 395000   |
| Running Forward KL  | 12.3     |
| Running Reverse KL  | 7.71     |
| Running Update Time | 79       |
----------------------------------
--2023-11-08 14:48:05.783356 CST--
| Itration            | 80       |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.07e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -383     |
| Running Env Steps   | 400000   |
| Running Forward KL  | 11.9     |
| Running Reverse KL  | 7.37     |
| Running Update Time | 80       |
----------------------------------
--2023-11-08 14:50:08.615000 CST--
| Itration            | 81       |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -388     |
| Running Env Steps   | 405000   |
| Running Forward KL  | 12       |
| Running Reverse KL  | 7.7      |
| Running Update Time | 81       |
----------------------------------
--2023-11-08 14:52:11.245466 CST--
| Itration            | 82       |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -378     |
| Running Env Steps   | 410000   |
| Running Forward KL  | 11.7     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 82       |
----------------------------------
--2023-11-08 14:54:18.993557 CST--
| Itration            | 83       |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.16e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -380     |
| Running Env Steps   | 415000   |
| Running Forward KL  | 11.5     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 83       |
----------------------------------
--2023-11-08 14:56:26.625055 CST--
| Itration            | 84       |
| Real Det Return     | 2.41e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.11e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -394     |
| Running Env Steps   | 420000   |
| Running Forward KL  | 11.6     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 84       |
----------------------------------
--2023-11-08 14:58:41.197237 CST--
| Itration            | 85       |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.14e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -388     |
| Running Env Steps   | 425000   |
| Running Forward KL  | 11.9     |
| Running Reverse KL  | 7.41     |
| Running Update Time | 85       |
----------------------------------
--2023-11-08 15:00:55.554598 CST--
| Itration            | 86       |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -393     |
| Running Env Steps   | 430000   |
| Running Forward KL  | 11.7     |
| Running Reverse KL  | 7.48     |
| Running Update Time | 86       |
----------------------------------
--2023-11-08 15:03:09.797861 CST--
| Itration            | 87       |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -398     |
| Running Env Steps   | 435000   |
| Running Forward KL  | 11.6     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 87       |
----------------------------------
--2023-11-08 15:05:24.020664 CST--
| Itration            | 88       |
| Real Det Return     | 2.61e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -399     |
| Running Env Steps   | 440000   |
| Running Forward KL  | 11.3     |
| Running Reverse KL  | 7.67     |
| Running Update Time | 88       |
----------------------------------
--2023-11-08 15:07:38.003499 CST--
| Itration            | 89       |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.18e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -394     |
| Running Env Steps   | 445000   |
| Running Forward KL  | 11.2     |
| Running Reverse KL  | 7.65     |
| Running Update Time | 89       |
----------------------------------
--2023-11-08 15:09:42.357203 CST--
| Itration            | 90       |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -394     |
| Running Env Steps   | 450000   |
| Running Forward KL  | 10.7     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 90       |
----------------------------------
--2023-11-08 15:11:46.535305 CST--
| Itration            | 91       |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.22e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -418     |
| Running Env Steps   | 455000   |
| Running Forward KL  | 11.3     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 91       |
----------------------------------
--2023-11-08 15:13:50.656174 CST--
| Itration            | 92       |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -398     |
| Running Env Steps   | 460000   |
| Running Forward KL  | 11.1     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 92       |
----------------------------------
--2023-11-08 15:15:55.028857 CST--
| Itration            | 93       |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.21e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -404     |
| Running Env Steps   | 465000   |
| Running Forward KL  | 10.5     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 93       |
----------------------------------
--2023-11-08 15:17:59.349643 CST--
| Itration            | 94       |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.19e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -418     |
| Running Env Steps   | 470000   |
| Running Forward KL  | 11       |
| Running Reverse KL  | 7.68     |
| Running Update Time | 94       |
----------------------------------
--2023-11-08 15:20:03.611150 CST--
| Itration            | 95       |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -408     |
| Running Env Steps   | 475000   |
| Running Forward KL  | 11.2     |
| Running Reverse KL  | 7.23     |
| Running Update Time | 95       |
----------------------------------
--2023-11-08 15:22:17.698086 CST--
| Itration            | 96       |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -420     |
| Running Env Steps   | 480000   |
| Running Forward KL  | 11.1     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 96       |
----------------------------------
--2023-11-08 15:24:31.689165 CST--
| Itration            | 97       |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.18e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -429     |
| Running Env Steps   | 485000   |
| Running Forward KL  | 11.6     |
| Running Reverse KL  | 7.67     |
| Running Update Time | 97       |
----------------------------------
--2023-11-08 15:26:45.888305 CST--
| Itration            | 98       |
| Real Det Return     | 2.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -396     |
| Running Env Steps   | 490000   |
| Running Forward KL  | 10.7     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 98       |
----------------------------------
--2023-11-08 15:28:56.085977 CST--
| Itration            | 99       |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -423     |
| Running Env Steps   | 495000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 99       |
----------------------------------
--2023-11-08 15:31:10.479762 CST--
| Itration            | 100      |
| Real Det Return     | 2.61e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.2e+03  |
| Real Sto violation  | 0.75     |
| Reward Loss         | -418     |
| Running Env Steps   | 500000   |
| Running Forward KL  | 10.6     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 100      |
----------------------------------
--2023-11-08 15:33:24.345186 CST--
| Itration            | 101      |
| Real Det Return     | 2.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -405     |
| Running Env Steps   | 505000   |
| Running Forward KL  | 10.9     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 101      |
----------------------------------
--2023-11-08 15:35:35.508615 CST--
| Itration            | 102      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -429     |
| Running Env Steps   | 510000   |
| Running Forward KL  | 10.8     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 102      |
----------------------------------
--2023-11-08 15:37:42.888204 CST--
| Itration            | 103      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -420     |
| Running Env Steps   | 515000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.72     |
| Running Update Time | 103      |
----------------------------------
--2023-11-08 15:39:50.404114 CST--
| Itration            | 104      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -432     |
| Running Env Steps   | 520000   |
| Running Forward KL  | 10.6     |
| Running Reverse KL  | 7.57     |
| Running Update Time | 104      |
----------------------------------
--2023-11-08 15:41:57.914540 CST--
| Itration            | 105      |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.24e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -448     |
| Running Env Steps   | 525000   |
| Running Forward KL  | 10.2     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 105      |
----------------------------------
--2023-11-08 15:44:05.954734 CST--
| Itration            | 106      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -429     |
| Running Env Steps   | 530000   |
| Running Forward KL  | 9.95     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 106      |
----------------------------------
--2023-11-08 15:46:13.786642 CST--
| Itration            | 107      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -421     |
| Running Env Steps   | 535000   |
| Running Forward KL  | 10.2     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 107      |
----------------------------------
--2023-11-08 15:48:21.394482 CST--
| Itration            | 108      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -434     |
| Running Env Steps   | 540000   |
| Running Forward KL  | 10.5     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 108      |
----------------------------------
--2023-11-08 15:50:29.408907 CST--
| Itration            | 109      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.26e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -450     |
| Running Env Steps   | 545000   |
| Running Forward KL  | 10.5     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 109      |
----------------------------------
--2023-11-08 15:52:36.706008 CST--
| Itration            | 110      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.25e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -428     |
| Running Env Steps   | 550000   |
| Running Forward KL  | 9.91     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 110      |
----------------------------------
--2023-11-08 15:54:43.475624 CST--
| Itration            | 111      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -454     |
| Running Env Steps   | 555000   |
| Running Forward KL  | 10.7     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 111      |
----------------------------------
--2023-11-08 15:56:50.718570 CST--
| Itration            | 112      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -450     |
| Running Env Steps   | 560000   |
| Running Forward KL  | 9.84     |
| Running Reverse KL  | 7.37     |
| Running Update Time | 112      |
----------------------------------
--2023-11-08 15:59:05.594638 CST--
| Itration            | 113      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -431     |
| Running Env Steps   | 565000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.44     |
| Running Update Time | 113      |
----------------------------------
--2023-11-08 16:01:19.881752 CST--
| Itration            | 114      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -453     |
| Running Env Steps   | 570000   |
| Running Forward KL  | 9.92     |
| Running Reverse KL  | 7.27     |
| Running Update Time | 114      |
----------------------------------
--2023-11-08 16:03:34.103074 CST--
| Itration            | 115      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -452     |
| Running Env Steps   | 575000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 115      |
----------------------------------
--2023-11-08 16:05:48.321501 CST--
| Itration            | 116      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -450     |
| Running Env Steps   | 580000   |
| Running Forward KL  | 9.91     |
| Running Reverse KL  | 7.69     |
| Running Update Time | 116      |
----------------------------------
--2023-11-08 16:08:02.751116 CST--
| Itration            | 117      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0.8      |
| Reward Loss         | -455     |
| Running Env Steps   | 585000   |
| Running Forward KL  | 9.75     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 117      |
----------------------------------
--2023-11-08 16:10:17.538786 CST--
| Itration            | 118      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.33e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -450     |
| Running Env Steps   | 590000   |
| Running Forward KL  | 9.76     |
| Running Reverse KL  | 7.44     |
| Running Update Time | 118      |
----------------------------------
--2023-11-08 16:12:31.586066 CST--
| Itration            | 119      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -474     |
| Running Env Steps   | 595000   |
| Running Forward KL  | 9.64     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 119      |
----------------------------------
--2023-11-08 16:14:45.463324 CST--
| Itration            | 120      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.27e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -457     |
| Running Env Steps   | 600000   |
| Running Forward KL  | 9.72     |
| Running Reverse KL  | 7.45     |
| Running Update Time | 120      |
----------------------------------
--2023-11-08 16:16:59.432497 CST--
| Itration            | 121      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -465     |
| Running Env Steps   | 605000   |
| Running Forward KL  | 10.1     |
| Running Reverse KL  | 7.48     |
| Running Update Time | 121      |
----------------------------------
--2023-11-08 16:19:13.581026 CST--
| Itration            | 122      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -456     |
| Running Env Steps   | 610000   |
| Running Forward KL  | 9.98     |
| Running Reverse KL  | 7.31     |
| Running Update Time | 122      |
----------------------------------
--2023-11-08 16:21:27.953829 CST--
| Itration            | 123      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.33e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -459     |
| Running Env Steps   | 615000   |
| Running Forward KL  | 9.52     |
| Running Reverse KL  | 7.38     |
| Running Update Time | 123      |
----------------------------------
--2023-11-08 16:23:42.122167 CST--
| Itration            | 124      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -454     |
| Running Env Steps   | 620000   |
| Running Forward KL  | 9.63     |
| Running Reverse KL  | 7.18     |
| Running Update Time | 124      |
----------------------------------
--2023-11-08 16:25:47.250203 CST--
| Itration            | 125      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -474     |
| Running Env Steps   | 625000   |
| Running Forward KL  | 9.23     |
| Running Reverse KL  | 7.34     |
| Running Update Time | 125      |
----------------------------------
--2023-11-08 16:27:52.653713 CST--
| Itration            | 126      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0.6      |
| Reward Loss         | -460     |
| Running Env Steps   | 630000   |
| Running Forward KL  | 9.37     |
| Running Reverse KL  | 7.28     |
| Running Update Time | 126      |
----------------------------------
--2023-11-08 16:29:57.247424 CST--
| Itration            | 127      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -486     |
| Running Env Steps   | 635000   |
| Running Forward KL  | 9.4      |
| Running Reverse KL  | 7.2      |
| Running Update Time | 127      |
----------------------------------
--2023-11-08 16:32:02.501380 CST--
| Itration            | 128      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.29e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -466     |
| Running Env Steps   | 640000   |
| Running Forward KL  | 9.6      |
| Running Reverse KL  | 7.2      |
| Running Update Time | 128      |
----------------------------------
--2023-11-08 16:34:07.365452 CST--
| Itration            | 129      |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -481     |
| Running Env Steps   | 645000   |
| Running Forward KL  | 9.63     |
| Running Reverse KL  | 7.13     |
| Running Update Time | 129      |
----------------------------------
--2023-11-08 16:36:12.196021 CST--
| Itration            | 130      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -462     |
| Running Env Steps   | 650000   |
| Running Forward KL  | 9.27     |
| Running Reverse KL  | 7.18     |
| Running Update Time | 130      |
----------------------------------
--2023-11-08 16:38:16.982402 CST--
| Itration            | 131      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -467     |
| Running Env Steps   | 655000   |
| Running Forward KL  | 9.55     |
| Running Reverse KL  | 7.06     |
| Running Update Time | 131      |
----------------------------------
--2023-11-08 16:40:21.634039 CST--
| Itration            | 132      |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -483     |
| Running Env Steps   | 660000   |
| Running Forward KL  | 9.13     |
| Running Reverse KL  | 7.13     |
| Running Update Time | 132      |
----------------------------------
--2023-11-08 16:42:26.840948 CST--
| Itration            | 133      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -482     |
| Running Env Steps   | 665000   |
| Running Forward KL  | 8.95     |
| Running Reverse KL  | 7.22     |
| Running Update Time | 133      |
----------------------------------
--2023-11-08 16:44:32.526160 CST--
| Itration            | 134      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -485     |
| Running Env Steps   | 670000   |
| Running Forward KL  | 9.33     |
| Running Reverse KL  | 7.11     |
| Running Update Time | 134      |
----------------------------------
--2023-11-08 16:46:38.040995 CST--
| Itration            | 135      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -490     |
| Running Env Steps   | 675000   |
| Running Forward KL  | 9.26     |
| Running Reverse KL  | 6.99     |
| Running Update Time | 135      |
----------------------------------
--2023-11-08 16:48:43.356142 CST--
| Itration            | 136      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -491     |
| Running Env Steps   | 680000   |
| Running Forward KL  | 9.12     |
| Running Reverse KL  | 7.01     |
| Running Update Time | 136      |
----------------------------------
--2023-11-08 16:50:48.636628 CST--
| Itration            | 137      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -493     |
| Running Env Steps   | 685000   |
| Running Forward KL  | 8.98     |
| Running Reverse KL  | 7.09     |
| Running Update Time | 137      |
----------------------------------
--2023-11-08 16:52:53.962148 CST--
| Itration            | 138      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -504     |
| Running Env Steps   | 690000   |
| Running Forward KL  | 9.42     |
| Running Reverse KL  | 7.23     |
| Running Update Time | 138      |
----------------------------------
--2023-11-08 16:54:59.149193 CST--
| Itration            | 139      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -500     |
| Running Env Steps   | 695000   |
| Running Forward KL  | 9.2      |
| Running Reverse KL  | 7.05     |
| Running Update Time | 139      |
----------------------------------
--2023-11-08 16:57:04.182316 CST--
| Itration            | 140      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.3e+03  |
| Real Sto violation  | 0.95     |
| Reward Loss         | -496     |
| Running Env Steps   | 700000   |
| Running Forward KL  | 9.11     |
| Running Reverse KL  | 7.15     |
| Running Update Time | 140      |
----------------------------------
--2023-11-08 16:59:09.105885 CST--
| Itration            | 141      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -487     |
| Running Env Steps   | 705000   |
| Running Forward KL  | 9.12     |
| Running Reverse KL  | 7.22     |
| Running Update Time | 141      |
----------------------------------
--2023-11-08 17:01:14.034532 CST--
| Itration            | 142      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -514     |
| Running Env Steps   | 710000   |
| Running Forward KL  | 9.01     |
| Running Reverse KL  | 7.02     |
| Running Update Time | 142      |
----------------------------------
--2023-11-08 17:03:19.112059 CST--
| Itration            | 143      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -472     |
| Running Env Steps   | 715000   |
| Running Forward KL  | 9.03     |
| Running Reverse KL  | 7.04     |
| Running Update Time | 143      |
----------------------------------
--2023-11-08 17:05:24.960511 CST--
| Itration            | 144      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -491     |
| Running Env Steps   | 720000   |
| Running Forward KL  | 8.55     |
| Running Reverse KL  | 7        |
| Running Update Time | 144      |
----------------------------------
--2023-11-08 17:07:31.282382 CST--
| Itration            | 145      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -503     |
| Running Env Steps   | 725000   |
| Running Forward KL  | 8.87     |
| Running Reverse KL  | 6.9      |
| Running Update Time | 145      |
----------------------------------
--2023-11-08 17:09:37.279470 CST--
| Itration            | 146      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -488     |
| Running Env Steps   | 730000   |
| Running Forward KL  | 8.65     |
| Running Reverse KL  | 7        |
| Running Update Time | 146      |
----------------------------------
--2023-11-08 17:11:42.276715 CST--
| Itration            | 147      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -520     |
| Running Env Steps   | 735000   |
| Running Forward KL  | 8.5      |
| Running Reverse KL  | 7.04     |
| Running Update Time | 147      |
----------------------------------
--2023-11-08 17:13:47.315173 CST--
| Itration            | 148      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -488     |
| Running Env Steps   | 740000   |
| Running Forward KL  | 8.84     |
| Running Reverse KL  | 6.84     |
| Running Update Time | 148      |
----------------------------------
--2023-11-08 17:15:52.445040 CST--
| Itration            | 149      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -505     |
| Running Env Steps   | 745000   |
| Running Forward KL  | 8.64     |
| Running Reverse KL  | 6.97     |
| Running Update Time | 149      |
----------------------------------
--2023-11-08 17:17:57.719727 CST--
| Itration            | 150      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -498     |
| Running Env Steps   | 750000   |
| Running Forward KL  | 9.01     |
| Running Reverse KL  | 6.91     |
| Running Update Time | 150      |
----------------------------------
--2023-11-08 17:20:02.934468 CST--
| Itration            | 151      |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -510     |
| Running Env Steps   | 755000   |
| Running Forward KL  | 8.56     |
| Running Reverse KL  | 7.1      |
| Running Update Time | 151      |
----------------------------------
--2023-11-08 17:22:08.297450 CST--
| Itration            | 152      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -511     |
| Running Env Steps   | 760000   |
| Running Forward KL  | 8.69     |
| Running Reverse KL  | 6.92     |
| Running Update Time | 152      |
----------------------------------
--2023-11-08 17:24:13.495151 CST--
| Itration            | 153      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.33e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -524     |
| Running Env Steps   | 765000   |
| Running Forward KL  | 8.61     |
| Running Reverse KL  | 7.03     |
| Running Update Time | 153      |
----------------------------------
--2023-11-08 17:26:18.528104 CST--
| Itration            | 154      |
| Real Det Return     | 2.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -525     |
| Running Env Steps   | 770000   |
| Running Forward KL  | 8.49     |
| Running Reverse KL  | 6.96     |
| Running Update Time | 154      |
----------------------------------
--2023-11-08 17:28:23.697440 CST--
| Itration            | 155      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -512     |
| Running Env Steps   | 775000   |
| Running Forward KL  | 8.41     |
| Running Reverse KL  | 6.92     |
| Running Update Time | 155      |
----------------------------------
--2023-11-08 17:30:29.025651 CST--
| Itration            | 156      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -524     |
| Running Env Steps   | 780000   |
| Running Forward KL  | 8.41     |
| Running Reverse KL  | 6.9      |
| Running Update Time | 156      |
----------------------------------
--2023-11-08 17:32:33.972004 CST--
| Itration            | 157      |
| Real Det Return     | 2.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.39e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -497     |
| Running Env Steps   | 785000   |
| Running Forward KL  | 8.52     |
| Running Reverse KL  | 6.81     |
| Running Update Time | 157      |
----------------------------------
--2023-11-08 17:34:39.321392 CST--
| Itration            | 158      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -504     |
| Running Env Steps   | 790000   |
| Running Forward KL  | 7.99     |
| Running Reverse KL  | 6.79     |
| Running Update Time | 158      |
----------------------------------
--2023-11-08 17:36:44.932301 CST--
| Itration            | 159      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -505     |
| Running Env Steps   | 795000   |
| Running Forward KL  | 8.53     |
| Running Reverse KL  | 6.9      |
| Running Update Time | 159      |
----------------------------------
--2023-11-08 17:38:50.801771 CST--
| Itration            | 160      |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -523     |
| Running Env Steps   | 800000   |
| Running Forward KL  | 8.48     |
| Running Reverse KL  | 6.89     |
| Running Update Time | 160      |
----------------------------------
--2023-11-08 17:41:00.644729 CST--
| Itration            | 161      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -516     |
| Running Env Steps   | 805000   |
| Running Forward KL  | 8.59     |
| Running Reverse KL  | 6.63     |
| Running Update Time | 161      |
----------------------------------
--2023-11-08 17:43:09.969289 CST--
| Itration            | 162      |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -528     |
| Running Env Steps   | 810000   |
| Running Forward KL  | 8.06     |
| Running Reverse KL  | 7.04     |
| Running Update Time | 162      |
----------------------------------
--2023-11-08 17:45:18.949043 CST--
| Itration            | 163      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -524     |
| Running Env Steps   | 815000   |
| Running Forward KL  | 8.26     |
| Running Reverse KL  | 6.76     |
| Running Update Time | 163      |
----------------------------------
--2023-11-08 17:47:28.029363 CST--
| Itration            | 164      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.44e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -492     |
| Running Env Steps   | 820000   |
| Running Forward KL  | 8.14     |
| Running Reverse KL  | 6.71     |
| Running Update Time | 164      |
----------------------------------
--2023-11-08 17:49:37.057685 CST--
| Itration            | 165      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -509     |
| Running Env Steps   | 825000   |
| Running Forward KL  | 8.09     |
| Running Reverse KL  | 6.66     |
| Running Update Time | 165      |
----------------------------------
--2023-11-08 17:51:45.892436 CST--
| Itration            | 166      |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -539     |
| Running Env Steps   | 830000   |
| Running Forward KL  | 8.35     |
| Running Reverse KL  | 6.76     |
| Running Update Time | 166      |
----------------------------------
--2023-11-08 17:53:54.773034 CST--
| Itration            | 167      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.85     |
| Reward Loss         | -510     |
| Running Env Steps   | 835000   |
| Running Forward KL  | 8.27     |
| Running Reverse KL  | 6.61     |
| Running Update Time | 167      |
----------------------------------
--2023-11-08 17:56:03.406727 CST--
| Itration            | 168      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -504     |
| Running Env Steps   | 840000   |
| Running Forward KL  | 8.35     |
| Running Reverse KL  | 6.57     |
| Running Update Time | 168      |
----------------------------------
--2023-11-08 17:58:12.317926 CST--
| Itration            | 169      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.39e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -528     |
| Running Env Steps   | 845000   |
| Running Forward KL  | 7.91     |
| Running Reverse KL  | 6.73     |
| Running Update Time | 169      |
----------------------------------
--2023-11-08 18:00:21.332544 CST--
| Itration            | 170      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -517     |
| Running Env Steps   | 850000   |
| Running Forward KL  | 8.31     |
| Running Reverse KL  | 6.62     |
| Running Update Time | 170      |
----------------------------------
--2023-11-08 18:02:30.005521 CST--
| Itration            | 171      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -538     |
| Running Env Steps   | 855000   |
| Running Forward KL  | 8.18     |
| Running Reverse KL  | 6.63     |
| Running Update Time | 171      |
----------------------------------
--2023-11-08 18:04:39.228074 CST--
| Itration            | 172      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -531     |
| Running Env Steps   | 860000   |
| Running Forward KL  | 8.12     |
| Running Reverse KL  | 6.52     |
| Running Update Time | 172      |
----------------------------------
--2023-11-08 18:06:48.340081 CST--
| Itration            | 173      |
| Real Det Return     | 2.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.44e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -514     |
| Running Env Steps   | 865000   |
| Running Forward KL  | 8.36     |
| Running Reverse KL  | 6.59     |
| Running Update Time | 173      |
----------------------------------
--2023-11-08 18:08:57.460448 CST--
| Itration            | 174      |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -518     |
| Running Env Steps   | 870000   |
| Running Forward KL  | 7.72     |
| Running Reverse KL  | 6.46     |
| Running Update Time | 174      |
----------------------------------
--2023-11-08 18:11:06.575203 CST--
| Itration            | 175      |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.44e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -536     |
| Running Env Steps   | 875000   |
| Running Forward KL  | 8.16     |
| Running Reverse KL  | 6.55     |
| Running Update Time | 175      |
----------------------------------
--2023-11-08 18:13:15.575318 CST--
| Itration            | 176      |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.42e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -508     |
| Running Env Steps   | 880000   |
| Running Forward KL  | 7.89     |
| Running Reverse KL  | 6.53     |
| Running Update Time | 176      |
----------------------------------
--2023-11-08 18:15:24.401839 CST--
| Itration            | 177      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.45e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -520     |
| Running Env Steps   | 885000   |
| Running Forward KL  | 7.55     |
| Running Reverse KL  | 6.52     |
| Running Update Time | 177      |
----------------------------------
--2023-11-08 18:17:33.339601 CST--
| Itration            | 178      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -519     |
| Running Env Steps   | 890000   |
| Running Forward KL  | 7.87     |
| Running Reverse KL  | 6.44     |
| Running Update Time | 178      |
----------------------------------
--2023-11-08 18:19:42.332805 CST--
| Itration            | 179      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -536     |
| Running Env Steps   | 895000   |
| Running Forward KL  | 7.58     |
| Running Reverse KL  | 6.42     |
| Running Update Time | 179      |
----------------------------------
--2023-11-08 18:21:51.434960 CST--
| Itration            | 180      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -548     |
| Running Env Steps   | 900000   |
| Running Forward KL  | 7.72     |
| Running Reverse KL  | 6.44     |
| Running Update Time | 180      |
----------------------------------
--2023-11-08 18:24:00.624749 CST--
| Itration            | 181      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.75     |
| Reward Loss         | -527     |
| Running Env Steps   | 905000   |
| Running Forward KL  | 7.76     |
| Running Reverse KL  | 6.53     |
| Running Update Time | 181      |
----------------------------------
--2023-11-08 18:26:09.734789 CST--
| Itration            | 182      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -526     |
| Running Env Steps   | 910000   |
| Running Forward KL  | 7.82     |
| Running Reverse KL  | 6.5      |
| Running Update Time | 182      |
----------------------------------
--2023-11-08 18:28:18.925270 CST--
| Itration            | 183      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -543     |
| Running Env Steps   | 915000   |
| Running Forward KL  | 7.65     |
| Running Reverse KL  | 6.54     |
| Running Update Time | 183      |
----------------------------------
--2023-11-08 18:30:27.809469 CST--
| Itration            | 184      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -539     |
| Running Env Steps   | 920000   |
| Running Forward KL  | 7.93     |
| Running Reverse KL  | 6.39     |
| Running Update Time | 184      |
----------------------------------
--2023-11-08 18:32:37.049182 CST--
| Itration            | 185      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.49e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -518     |
| Running Env Steps   | 925000   |
| Running Forward KL  | 7.74     |
| Running Reverse KL  | 6.3      |
| Running Update Time | 185      |
----------------------------------
--2023-11-08 18:34:45.831495 CST--
| Itration            | 186      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -531     |
| Running Env Steps   | 930000   |
| Running Forward KL  | 7.92     |
| Running Reverse KL  | 6.48     |
| Running Update Time | 186      |
----------------------------------
--2023-11-08 18:36:54.815312 CST--
| Itration            | 187      |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.4e+03  |
| Real Sto violation  | 0.75     |
| Reward Loss         | -541     |
| Running Env Steps   | 935000   |
| Running Forward KL  | 7.69     |
| Running Reverse KL  | 6.34     |
| Running Update Time | 187      |
----------------------------------
--2023-11-08 18:39:03.468591 CST--
| Itration            | 188      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -535     |
| Running Env Steps   | 940000   |
| Running Forward KL  | 7.55     |
| Running Reverse KL  | 6.42     |
| Running Update Time | 188      |
----------------------------------
--2023-11-08 18:41:07.482707 CST--
| Itration            | 189      |
| Real Det Return     | 2.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.49e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -522     |
| Running Env Steps   | 945000   |
| Running Forward KL  | 7.31     |
| Running Reverse KL  | 6.42     |
| Running Update Time | 189      |
----------------------------------
--2023-11-08 18:43:11.969692 CST--
| Itration            | 190      |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.46e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -533     |
| Running Env Steps   | 950000   |
| Running Forward KL  | 7.25     |
| Running Reverse KL  | 6.25     |
| Running Update Time | 190      |
----------------------------------
--2023-11-08 18:45:15.704799 CST--
| Itration            | 191      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.51e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -518     |
| Running Env Steps   | 955000   |
| Running Forward KL  | 7.18     |
| Running Reverse KL  | 6.16     |
| Running Update Time | 191      |
----------------------------------
--2023-11-08 18:47:19.646492 CST--
| Itration            | 192      |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0.9      |
| Reward Loss         | -526     |
| Running Env Steps   | 960000   |
| Running Forward KL  | 7.32     |
| Running Reverse KL  | 6.24     |
| Running Update Time | 192      |
----------------------------------
--2023-11-08 18:49:23.460804 CST--
| Itration            | 193      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.51e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -536     |
| Running Env Steps   | 965000   |
| Running Forward KL  | 7.47     |
| Running Reverse KL  | 6.13     |
| Running Update Time | 193      |
----------------------------------
--2023-11-08 18:51:27.265322 CST--
| Itration            | 194      |
| Real Det Return     | 2.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.48e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -520     |
| Running Env Steps   | 970000   |
| Running Forward KL  | 7.09     |
| Running Reverse KL  | 6.41     |
| Running Update Time | 194      |
----------------------------------
--2023-11-08 18:53:31.645935 CST--
| Itration            | 195      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -549     |
| Running Env Steps   | 975000   |
| Running Forward KL  | 7.4      |
| Running Reverse KL  | 6.4      |
| Running Update Time | 195      |
----------------------------------
--2023-11-08 18:55:35.865023 CST--
| Itration            | 196      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -546     |
| Running Env Steps   | 980000   |
| Running Forward KL  | 7.66     |
| Running Reverse KL  | 6.21     |
| Running Update Time | 196      |
----------------------------------
--2023-11-08 18:57:40.877536 CST--
| Itration            | 197      |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -535     |
| Running Env Steps   | 985000   |
| Running Forward KL  | 7.31     |
| Running Reverse KL  | 6.29     |
| Running Update Time | 197      |
----------------------------------
--2023-11-08 18:59:45.105238 CST--
| Itration            | 198      |
| Real Det Return     | 2.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -538     |
| Running Env Steps   | 990000   |
| Running Forward KL  | 7.32     |
| Running Reverse KL  | 6.2      |
| Running Update Time | 198      |
----------------------------------
--2023-11-08 19:01:49.518223 CST--
| Itration            | 199      |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0.8      |
| Reward Loss         | -534     |
| Running Env Steps   | 995000   |
| Running Forward KL  | 7.18     |
| Running Reverse KL  | 6.19     |
| Running Update Time | 199      |
----------------------------------
--2023-11-08 19:03:54.691062 CST--
| Itration            | 200      |
| Real Det Return     | 2.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.48e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -558     |
| Running Env Steps   | 1000000  |
| Running Forward KL  | 7.27     |
| Running Reverse KL  | 6.1      |
| Running Update Time | 200      |
----------------------------------
--2023-11-08 19:05:59.365994 CST--
| Itration            | 201      |
| Real Det Return     | 2.57e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -548     |
| Running Env Steps   | 1005000  |
| Running Forward KL  | 7.28     |
| Running Reverse KL  | 6.2      |
| Running Update Time | 201      |
----------------------------------
--2023-11-08 19:08:04.094257 CST--
| Itration            | 202      |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0.8      |
| Reward Loss         | -548     |
| Running Env Steps   | 1010000  |
| Running Forward KL  | 7.19     |
| Running Reverse KL  | 6.19     |
| Running Update Time | 202      |
----------------------------------
--2023-11-08 19:10:08.884983 CST--
| Itration            | 203      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.51e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -549     |
| Running Env Steps   | 1015000  |
| Running Forward KL  | 7.44     |
| Running Reverse KL  | 6.16     |
| Running Update Time | 203      |
----------------------------------
--2023-11-08 19:12:13.967329 CST--
| Itration            | 204      |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -538     |
| Running Env Steps   | 1020000  |
| Running Forward KL  | 7.15     |
| Running Reverse KL  | 6.08     |
| Running Update Time | 204      |
----------------------------------
--2023-11-08 19:14:19.188036 CST--
| Itration            | 205      |
| Real Det Return     | 2.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0.55     |
| Reward Loss         | -536     |
| Running Env Steps   | 1025000  |
| Running Forward KL  | 6.8      |
| Running Reverse KL  | 6.09     |
| Running Update Time | 205      |
----------------------------------
--2023-11-08 19:16:24.273527 CST--
| Itration            | 206      |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.51e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -539     |
| Running Env Steps   | 1030000  |
| Running Forward KL  | 7.03     |
| Running Reverse KL  | 6.23     |
| Running Update Time | 206      |
----------------------------------
--2023-11-08 19:18:28.989459 CST--
| Itration            | 207      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -528     |
| Running Env Steps   | 1035000  |
| Running Forward KL  | 7.15     |
| Running Reverse KL  | 5.91     |
| Running Update Time | 207      |
----------------------------------
--2023-11-08 19:20:34.113432 CST--
| Itration            | 208      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.49e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -552     |
| Running Env Steps   | 1040000  |
| Running Forward KL  | 6.98     |
| Running Reverse KL  | 6        |
| Running Update Time | 208      |
----------------------------------
--2023-11-08 19:22:38.769888 CST--
| Itration            | 209      |
| Real Det Return     | 2.58e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -544     |
| Running Env Steps   | 1045000  |
| Running Forward KL  | 7.06     |
| Running Reverse KL  | 6.07     |
| Running Update Time | 209      |
----------------------------------
--2023-11-08 19:24:43.300291 CST--
| Itration            | 210      |
| Real Det Return     | 2.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -545     |
| Running Env Steps   | 1050000  |
| Running Forward KL  | 6.58     |
| Running Reverse KL  | 6.11     |
| Running Update Time | 210      |
----------------------------------
--2023-11-08 19:26:47.888655 CST--
| Itration            | 211      |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -542     |
| Running Env Steps   | 1055000  |
| Running Forward KL  | 6.75     |
| Running Reverse KL  | 5.95     |
| Running Update Time | 211      |
----------------------------------
--2023-11-08 19:28:52.795390 CST--
| Itration            | 212      |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -550     |
| Running Env Steps   | 1060000  |
| Running Forward KL  | 7        |
| Running Reverse KL  | 6.07     |
| Running Update Time | 212      |
----------------------------------
--2023-11-08 19:30:57.857716 CST--
| Itration            | 213      |
| Real Det Return     | 2.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -550     |
| Running Env Steps   | 1065000  |
| Running Forward KL  | 7.32     |
| Running Reverse KL  | 6.13     |
| Running Update Time | 213      |
----------------------------------
--2023-11-08 19:33:03.347720 CST--
| Itration            | 214      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 0.7      |
| Reward Loss         | -535     |
| Running Env Steps   | 1070000  |
| Running Forward KL  | 6.69     |
| Running Reverse KL  | 6.03     |
| Running Update Time | 214      |
----------------------------------
--2023-11-08 19:35:08.837682 CST--
| Itration            | 215      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -549     |
| Running Env Steps   | 1075000  |
| Running Forward KL  | 7.19     |
| Running Reverse KL  | 5.96     |
| Running Update Time | 215      |
----------------------------------
--2023-11-08 19:37:14.652550 CST--
| Itration            | 216      |
| Real Det Return     | 2.61e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -551     |
| Running Env Steps   | 1080000  |
| Running Forward KL  | 6.94     |
| Running Reverse KL  | 5.95     |
| Running Update Time | 216      |
----------------------------------
--2023-11-08 19:39:19.879234 CST--
| Itration            | 217      |
| Real Det Return     | 2.53e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -506     |
| Running Env Steps   | 1085000  |
| Running Forward KL  | 6.85     |
| Running Reverse KL  | 6.06     |
| Running Update Time | 217      |
----------------------------------
--2023-11-08 19:41:24.624477 CST--
| Itration            | 218      |
| Real Det Return     | 2.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -536     |
| Running Env Steps   | 1090000  |
| Running Forward KL  | 6.64     |
| Running Reverse KL  | 5.98     |
| Running Update Time | 218      |
----------------------------------
--2023-11-08 19:43:28.457294 CST--
| Itration            | 219      |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.53e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -537     |
| Running Env Steps   | 1095000  |
| Running Forward KL  | 6.75     |
| Running Reverse KL  | 6.01     |
| Running Update Time | 219      |
----------------------------------
--2023-11-08 19:45:32.636840 CST--
| Itration            | 220      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -540     |
| Running Env Steps   | 1100000  |
| Running Forward KL  | 6.69     |
| Running Reverse KL  | 5.88     |
| Running Update Time | 220      |
----------------------------------
--2023-11-08 19:47:36.489780 CST--
| Itration            | 221      |
| Real Det Return     | 2.5e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -522     |
| Running Env Steps   | 1105000  |
| Running Forward KL  | 6.57     |
| Running Reverse KL  | 5.91     |
| Running Update Time | 221      |
----------------------------------
--2023-11-08 19:49:40.304393 CST--
| Itration            | 222      |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -541     |
| Running Env Steps   | 1110000  |
| Running Forward KL  | 6.6      |
| Running Reverse KL  | 5.99     |
| Running Update Time | 222      |
----------------------------------
--2023-11-08 19:51:43.873033 CST--
| Itration            | 223      |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -537     |
| Running Env Steps   | 1115000  |
| Running Forward KL  | 6.64     |
| Running Reverse KL  | 5.93     |
| Running Update Time | 223      |
----------------------------------
--2023-11-08 19:53:47.688444 CST--
| Itration            | 224      |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -563     |
| Running Env Steps   | 1120000  |
| Running Forward KL  | 6.29     |
| Running Reverse KL  | 5.88     |
| Running Update Time | 224      |
----------------------------------
--2023-11-08 19:55:51.622411 CST--
| Itration            | 225      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -548     |
| Running Env Steps   | 1125000  |
| Running Forward KL  | 6.69     |
| Running Reverse KL  | 5.85     |
| Running Update Time | 225      |
----------------------------------
--2023-11-08 19:57:56.233035 CST--
| Itration            | 226      |
| Real Det Return     | 2.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -546     |
| Running Env Steps   | 1130000  |
| Running Forward KL  | 6.16     |
| Running Reverse KL  | 5.81     |
| Running Update Time | 226      |
----------------------------------
--2023-11-08 20:00:00.172069 CST--
| Itration            | 227      |
| Real Det Return     | 2.38e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -544     |
| Running Env Steps   | 1135000  |
| Running Forward KL  | 6.59     |
| Running Reverse KL  | 5.91     |
| Running Update Time | 227      |
----------------------------------
--2023-11-08 20:02:03.846130 CST--
| Itration            | 228      |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -556     |
| Running Env Steps   | 1140000  |
| Running Forward KL  | 6.76     |
| Running Reverse KL  | 5.79     |
| Running Update Time | 228      |
----------------------------------
--2023-11-08 20:04:07.702538 CST--
| Itration            | 229      |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -514     |
| Running Env Steps   | 1145000  |
| Running Forward KL  | 6.68     |
| Running Reverse KL  | 5.75     |
| Running Update Time | 229      |
----------------------------------
--2023-11-08 20:06:11.656556 CST--
| Itration            | 230      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -513     |
| Running Env Steps   | 1150000  |
| Running Forward KL  | 6.2      |
| Running Reverse KL  | 5.63     |
| Running Update Time | 230      |
----------------------------------
--2023-11-08 20:08:15.921498 CST--
| Itration            | 231      |
| Real Det Return     | 2.34e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -539     |
| Running Env Steps   | 1155000  |
| Running Forward KL  | 6.48     |
| Running Reverse KL  | 5.69     |
| Running Update Time | 231      |
----------------------------------
--2023-11-08 20:10:19.976817 CST--
| Itration            | 232      |
| Real Det Return     | 2.5e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -511     |
| Running Env Steps   | 1160000  |
| Running Forward KL  | 6.61     |
| Running Reverse KL  | 5.91     |
| Running Update Time | 232      |
----------------------------------
--2023-11-08 20:12:23.926659 CST--
| Itration            | 233      |
| Real Det Return     | 2.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -533     |
| Running Env Steps   | 1165000  |
| Running Forward KL  | 6.24     |
| Running Reverse KL  | 5.83     |
| Running Update Time | 233      |
----------------------------------
--2023-11-08 20:14:27.858171 CST--
| Itration            | 234      |
| Real Det Return     | 2.37e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -533     |
| Running Env Steps   | 1170000  |
| Running Forward KL  | 6.08     |
| Running Reverse KL  | 5.83     |
| Running Update Time | 234      |
----------------------------------
--2023-11-08 20:16:31.655423 CST--
| Itration            | 235      |
| Real Det Return     | 2.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -536     |
| Running Env Steps   | 1175000  |
| Running Forward KL  | 6.22     |
| Running Reverse KL  | 5.65     |
| Running Update Time | 235      |
----------------------------------
--2023-11-08 20:18:35.445906 CST--
| Itration            | 236      |
| Real Det Return     | 2.23e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -523     |
| Running Env Steps   | 1180000  |
| Running Forward KL  | 6.1      |
| Running Reverse KL  | 5.74     |
| Running Update Time | 236      |
----------------------------------
--2023-11-08 20:20:39.744647 CST--
| Itration            | 237      |
| Real Det Return     | 2.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -520     |
| Running Env Steps   | 1185000  |
| Running Forward KL  | 6.28     |
| Running Reverse KL  | 5.8      |
| Running Update Time | 237      |
----------------------------------
--2023-11-08 20:22:44.364425 CST--
| Itration            | 238      |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -524     |
| Running Env Steps   | 1190000  |
| Running Forward KL  | 6.29     |
| Running Reverse KL  | 5.58     |
| Running Update Time | 238      |
----------------------------------
--2023-11-08 20:24:52.570936 CST--
| Itration            | 239      |
| Real Det Return     | 2.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -513     |
| Running Env Steps   | 1195000  |
| Running Forward KL  | 6.57     |
| Running Reverse KL  | 5.82     |
| Running Update Time | 239      |
----------------------------------
--2023-11-08 20:27:00.139567 CST--
| Itration            | 240      |
| Real Det Return     | 2.49e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.6e+03  |
| Real Sto violation  | 0.6      |
| Reward Loss         | -502     |
| Running Env Steps   | 1200000  |
| Running Forward KL  | 5.97     |
| Running Reverse KL  | 5.67     |
| Running Update Time | 240      |
----------------------------------
--2023-11-08 20:29:07.738911 CST--
| Itration            | 241      |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -513     |
| Running Env Steps   | 1205000  |
| Running Forward KL  | 6.35     |
| Running Reverse KL  | 5.62     |
| Running Update Time | 241      |
----------------------------------
--2023-11-08 20:31:14.944624 CST--
| Itration            | 242      |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -503     |
| Running Env Steps   | 1210000  |
| Running Forward KL  | 6.34     |
| Running Reverse KL  | 5.61     |
| Running Update Time | 242      |
----------------------------------
--2023-11-08 20:33:21.431045 CST--
| Itration            | 243      |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -529     |
| Running Env Steps   | 1215000  |
| Running Forward KL  | 5.99     |
| Running Reverse KL  | 5.76     |
| Running Update Time | 243      |
----------------------------------
--2023-11-08 20:35:28.936933 CST--
| Itration            | 244      |
| Real Det Return     | 2.21e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -527     |
| Running Env Steps   | 1220000  |
| Running Forward KL  | 5.93     |
| Running Reverse KL  | 5.68     |
| Running Update Time | 244      |
----------------------------------
--2023-11-08 20:37:36.234970 CST--
| Itration            | 245      |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -522     |
| Running Env Steps   | 1225000  |
| Running Forward KL  | 6.17     |
| Running Reverse KL  | 5.49     |
| Running Update Time | 245      |
----------------------------------
--2023-11-08 20:39:44.042832 CST--
| Itration            | 246      |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -558     |
| Running Env Steps   | 1230000  |
| Running Forward KL  | 6.11     |
| Running Reverse KL  | 5.55     |
| Running Update Time | 246      |
----------------------------------
--2023-11-08 20:41:52.568313 CST--
| Itration            | 247      |
| Real Det Return     | 2.28e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -542     |
| Running Env Steps   | 1235000  |
| Running Forward KL  | 6.3      |
| Running Reverse KL  | 5.71     |
| Running Update Time | 247      |
----------------------------------
--2023-11-08 20:44:01.292849 CST--
| Itration            | 248      |
| Real Det Return     | 2.55e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -521     |
| Running Env Steps   | 1240000  |
| Running Forward KL  | 6.24     |
| Running Reverse KL  | 5.71     |
| Running Update Time | 248      |
----------------------------------
--2023-11-08 20:46:10.040030 CST--
| Itration            | 249      |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -532     |
| Running Env Steps   | 1245000  |
| Running Forward KL  | 6.26     |
| Running Reverse KL  | 5.53     |
| Running Update Time | 249      |
----------------------------------
--2023-11-08 20:48:18.854357 CST--
| Itration            | 250      |
| Real Det Return     | 2.37e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.6e+03  |
| Real Sto violation  | 0.75     |
| Reward Loss         | -516     |
| Running Env Steps   | 1250000  |
| Running Forward KL  | 5.78     |
| Running Reverse KL  | 5.56     |
| Running Update Time | 250      |
----------------------------------
--2023-11-08 20:50:27.480389 CST--
| Itration            | 251      |
| Real Det Return     | 2.42e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -542     |
| Running Env Steps   | 1255000  |
| Running Forward KL  | 5.99     |
| Running Reverse KL  | 5.47     |
| Running Update Time | 251      |
----------------------------------
--2023-11-08 20:52:36.304516 CST--
| Itration            | 252      |
| Real Det Return     | 2.32e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -526     |
| Running Env Steps   | 1260000  |
| Running Forward KL  | 6.16     |
| Running Reverse KL  | 5.52     |
| Running Update Time | 252      |
----------------------------------
--2023-11-08 20:54:45.329910 CST--
| Itration            | 253      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -512     |
| Running Env Steps   | 1265000  |
| Running Forward KL  | 5.52     |
| Running Reverse KL  | 5.53     |
| Running Update Time | 253      |
----------------------------------
--2023-11-08 20:56:53.963079 CST--
| Itration            | 254      |
| Real Det Return     | 2.24e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -529     |
| Running Env Steps   | 1270000  |
| Running Forward KL  | 6.02     |
| Running Reverse KL  | 5.53     |
| Running Update Time | 254      |
----------------------------------
--2023-11-08 20:59:02.293164 CST--
| Itration            | 255      |
| Real Det Return     | 2.27e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -531     |
| Running Env Steps   | 1275000  |
| Running Forward KL  | 5.71     |
| Running Reverse KL  | 5.51     |
| Running Update Time | 255      |
----------------------------------
--2023-11-08 21:01:11.564053 CST--
| Itration            | 256      |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -521     |
| Running Env Steps   | 1280000  |
| Running Forward KL  | 5.53     |
| Running Reverse KL  | 5.36     |
| Running Update Time | 256      |
----------------------------------
--2023-11-08 21:03:20.812342 CST--
| Itration            | 257      |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.6e+03  |
| Real Sto violation  | 0.95     |
| Reward Loss         | -512     |
| Running Env Steps   | 1285000  |
| Running Forward KL  | 5.66     |
| Running Reverse KL  | 5.41     |
| Running Update Time | 257      |
----------------------------------
--2023-11-08 21:05:28.627109 CST--
| Itration            | 258      |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -526     |
| Running Env Steps   | 1290000  |
| Running Forward KL  | 5.74     |
| Running Reverse KL  | 5.63     |
| Running Update Time | 258      |
----------------------------------
--2023-11-08 21:07:36.846796 CST--
| Itration            | 259      |
| Real Det Return     | 2.45e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -524     |
| Running Env Steps   | 1295000  |
| Running Forward KL  | 5.65     |
| Running Reverse KL  | 5.49     |
| Running Update Time | 259      |
----------------------------------
--2023-11-08 21:09:45.653514 CST--
| Itration            | 260      |
| Real Det Return     | 2.25e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -525     |
| Running Env Steps   | 1300000  |
| Running Forward KL  | 5.65     |
| Running Reverse KL  | 5.43     |
| Running Update Time | 260      |
----------------------------------
--2023-11-08 21:11:54.819857 CST--
| Itration            | 261      |
| Real Det Return     | 2.36e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -523     |
| Running Env Steps   | 1305000  |
| Running Forward KL  | 6.01     |
| Running Reverse KL  | 5.53     |
| Running Update Time | 261      |
----------------------------------
--2023-11-08 21:14:04.102942 CST--
| Itration            | 262      |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -531     |
| Running Env Steps   | 1310000  |
| Running Forward KL  | 5.73     |
| Running Reverse KL  | 5.45     |
| Running Update Time | 262      |
----------------------------------
--2023-11-08 21:16:13.145686 CST--
| Itration            | 263      |
| Real Det Return     | 2.18e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -515     |
| Running Env Steps   | 1315000  |
| Running Forward KL  | 5.25     |
| Running Reverse KL  | 5.43     |
| Running Update Time | 263      |
----------------------------------
--2023-11-08 21:18:22.644278 CST--
| Itration            | 264      |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -527     |
| Running Env Steps   | 1320000  |
| Running Forward KL  | 5.51     |
| Running Reverse KL  | 5.4      |
| Running Update Time | 264      |
----------------------------------
--2023-11-08 21:20:31.358369 CST--
| Itration            | 265      |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -505     |
| Running Env Steps   | 1325000  |
| Running Forward KL  | 5.6      |
| Running Reverse KL  | 5.43     |
| Running Update Time | 265      |
----------------------------------
--2023-11-08 21:22:40.715780 CST--
| Itration            | 266      |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -524     |
| Running Env Steps   | 1330000  |
| Running Forward KL  | 5.91     |
| Running Reverse KL  | 5.4      |
| Running Update Time | 266      |
----------------------------------
--2023-11-08 21:24:50.233592 CST--
| Itration            | 267      |
| Real Det Return     | 2.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -529     |
| Running Env Steps   | 1335000  |
| Running Forward KL  | 5.7      |
| Running Reverse KL  | 5.45     |
| Running Update Time | 267      |
----------------------------------
--2023-11-08 21:26:59.271191 CST--
| Itration            | 268      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | -536     |
| Running Env Steps   | 1340000  |
| Running Forward KL  | 5.54     |
| Running Reverse KL  | 5.48     |
| Running Update Time | 268      |
----------------------------------
--2023-11-08 21:29:08.651059 CST--
| Itration            | 269      |
| Real Det Return     | 2.56e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -496     |
| Running Env Steps   | 1345000  |
| Running Forward KL  | 5.64     |
| Running Reverse KL  | 5.38     |
| Running Update Time | 269      |
----------------------------------
--2023-11-08 21:31:17.657592 CST--
| Itration            | 270      |
| Real Det Return     | 2.61e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -497     |
| Running Env Steps   | 1350000  |
| Running Forward KL  | 5.88     |
| Running Reverse KL  | 5.41     |
| Running Update Time | 270      |
----------------------------------
--2023-11-08 21:33:27.190423 CST--
| Itration            | 271      |
| Real Det Return     | 2.6e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -503     |
| Running Env Steps   | 1355000  |
| Running Forward KL  | 5.9      |
| Running Reverse KL  | 5.44     |
| Running Update Time | 271      |
----------------------------------
--2023-11-08 21:35:36.344790 CST--
| Itration            | 272      |
| Real Det Return     | 2.5e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -474     |
| Running Env Steps   | 1360000  |
| Running Forward KL  | 5.41     |
| Running Reverse KL  | 5.36     |
| Running Update Time | 272      |
----------------------------------
--2023-11-08 21:37:45.016635 CST--
| Itration            | 273      |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -492     |
| Running Env Steps   | 1365000  |
| Running Forward KL  | 5.39     |
| Running Reverse KL  | 5.19     |
| Running Update Time | 273      |
----------------------------------
--2023-11-08 21:39:53.219127 CST--
| Itration            | 274      |
| Real Det Return     | 2.23e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -522     |
| Running Env Steps   | 1370000  |
| Running Forward KL  | 5.45     |
| Running Reverse KL  | 5.44     |
| Running Update Time | 274      |
----------------------------------
--2023-11-08 21:42:02.119225 CST--
| Itration            | 275      |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -511     |
| Running Env Steps   | 1375000  |
| Running Forward KL  | 5.28     |
| Running Reverse KL  | 5.21     |
| Running Update Time | 275      |
----------------------------------
--2023-11-08 21:44:10.272432 CST--
| Itration            | 276      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -516     |
| Running Env Steps   | 1380000  |
| Running Forward KL  | 5.68     |
| Running Reverse KL  | 5.28     |
| Running Update Time | 276      |
----------------------------------
--2023-11-08 21:46:19.615809 CST--
| Itration            | 277      |
| Real Det Return     | 2.49e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -488     |
| Running Env Steps   | 1385000  |
| Running Forward KL  | 5.33     |
| Running Reverse KL  | 5.14     |
| Running Update Time | 277      |
----------------------------------
--2023-11-08 21:48:28.575850 CST--
| Itration            | 278      |
| Real Det Return     | 2.7e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -508     |
| Running Env Steps   | 1390000  |
| Running Forward KL  | 5.55     |
| Running Reverse KL  | 5.18     |
| Running Update Time | 278      |
----------------------------------
--2023-11-08 21:50:38.820754 CST--
| Itration            | 279      |
| Real Det Return     | 2.06e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.5      |
| Reward Loss         | -516     |
| Running Env Steps   | 1395000  |
| Running Forward KL  | 5.38     |
| Running Reverse KL  | 5.36     |
| Running Update Time | 279      |
----------------------------------
--2023-11-08 21:52:49.389417 CST--
| Itration            | 280      |
| Real Det Return     | 2.54e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.6      |
| Reward Loss         | -506     |
| Running Env Steps   | 1400000  |
| Running Forward KL  | 5.27     |
| Running Reverse KL  | 5.41     |
| Running Update Time | 280      |
----------------------------------
--2023-11-08 21:54:59.709375 CST--
| Itration            | 281      |
| Real Det Return     | 2.59e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -506     |
| Running Env Steps   | 1405000  |
| Running Forward KL  | 5.53     |
| Running Reverse KL  | 5.36     |
| Running Update Time | 281      |
----------------------------------
--2023-11-08 21:57:09.634384 CST--
| Itration            | 282      |
| Real Det Return     | 2.51e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -505     |
| Running Env Steps   | 1410000  |
| Running Forward KL  | 5.31     |
| Running Reverse KL  | 5.14     |
| Running Update Time | 282      |
----------------------------------
--2023-11-08 21:59:19.866554 CST--
| Itration            | 283      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.6e+03  |
| Real Sto violation  | 0.75     |
| Reward Loss         | -502     |
| Running Env Steps   | 1415000  |
| Running Forward KL  | 5.09     |
| Running Reverse KL  | 5.3      |
| Running Update Time | 283      |
----------------------------------
--2023-11-08 22:01:30.003482 CST--
| Itration            | 284      |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.59e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -532     |
| Running Env Steps   | 1420000  |
| Running Forward KL  | 5.01     |
| Running Reverse KL  | 5.13     |
| Running Update Time | 284      |
----------------------------------
--2023-11-08 22:03:40.201791 CST--
| Itration            | 285      |
| Real Det Return     | 2.53e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -521     |
| Running Env Steps   | 1425000  |
| Running Forward KL  | 5.42     |
| Running Reverse KL  | 5.33     |
| Running Update Time | 285      |
----------------------------------
--2023-11-08 22:05:50.257115 CST--
| Itration            | 286      |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.9      |
| Reward Loss         | -504     |
| Running Env Steps   | 1430000  |
| Running Forward KL  | 5.66     |
| Running Reverse KL  | 5.38     |
| Running Update Time | 286      |
----------------------------------
--2023-11-08 22:08:00.543417 CST--
| Itration            | 287      |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -474     |
| Running Env Steps   | 1435000  |
| Running Forward KL  | 5.13     |
| Running Reverse KL  | 5.22     |
| Running Update Time | 287      |
----------------------------------
--2023-11-08 22:10:10.344963 CST--
| Itration            | 288      |
| Real Det Return     | 2.5e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.5e+03  |
| Real Sto violation  | 1        |
| Reward Loss         | -486     |
| Running Env Steps   | 1440000  |
| Running Forward KL  | 5.61     |
| Running Reverse KL  | 5.44     |
| Running Update Time | 288      |
----------------------------------
--2023-11-08 22:12:20.812081 CST--
| Itration            | 289      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 1        |
| Reward Loss         | -491     |
| Running Env Steps   | 1445000  |
| Running Forward KL  | 4.92     |
| Running Reverse KL  | 5.17     |
| Running Update Time | 289      |
----------------------------------
--2023-11-08 22:14:30.984384 CST--
| Itration            | 290      |
| Real Det Return     | 2.22e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -508     |
| Running Env Steps   | 1450000  |
| Running Forward KL  | 4.95     |
| Running Reverse KL  | 5.22     |
| Running Update Time | 290      |
----------------------------------
--2023-11-08 22:16:41.640138 CST--
| Itration            | 291      |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.54e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -465     |
| Running Env Steps   | 1455000  |
| Running Forward KL  | 5.56     |
| Running Reverse KL  | 5.39     |
| Running Update Time | 291      |
----------------------------------
--2023-11-08 22:18:51.954824 CST--
| Itration            | 292      |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.7      |
| Reward Loss         | -521     |
| Running Env Steps   | 1460000  |
| Running Forward KL  | 5.2      |
| Running Reverse KL  | 5.24     |
| Running Update Time | 292      |
----------------------------------
--2023-11-08 22:21:02.611310 CST--
| Itration            | 293      |
| Real Det Return     | 2.65e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.58e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -493     |
| Running Env Steps   | 1465000  |
| Running Forward KL  | 5.16     |
| Running Reverse KL  | 5.22     |
| Running Update Time | 293      |
----------------------------------
--2023-11-08 22:23:12.556656 CST--
| Itration            | 294      |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.8      |
| Reward Loss         | -482     |
| Running Env Steps   | 1470000  |
| Running Forward KL  | 5.01     |
| Running Reverse KL  | 5.22     |
| Running Update Time | 294      |
----------------------------------
--2023-11-08 22:25:22.623341 CST--
| Itration            | 295      |
| Real Det Return     | 2.83e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -503     |
| Running Env Steps   | 1475000  |
| Running Forward KL  | 5.06     |
| Running Reverse KL  | 5.07     |
| Running Update Time | 295      |
----------------------------------
--2023-11-08 22:27:32.502476 CST--
| Itration            | 296      |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.55e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | -523     |
| Running Env Steps   | 1480000  |
| Running Forward KL  | 5.15     |
| Running Reverse KL  | 5.18     |
| Running Update Time | 296      |
----------------------------------
--2023-11-08 22:29:42.278652 CST--
| Itration            | 297      |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.57e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | -508     |
| Running Env Steps   | 1485000  |
| Running Forward KL  | 4.81     |
| Running Reverse KL  | 4.99     |
| Running Update Time | 297      |
----------------------------------
--2023-11-08 22:31:52.158234 CST--
| Itration            | 298      |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.56e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | -495     |
| Running Env Steps   | 1490000  |
| Running Forward KL  | 5.13     |
| Running Reverse KL  | 5.14     |
| Running Update Time | 298      |
----------------------------------
