Logging to logs/HalfCheetah-v3/exp-1/maxentirl/2023_11_09_05_15_16
--2023-11-09 05:16:30.353258 CST--
| Itration            | 0        |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.78e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | 30.3     |
| Running Env Steps   | 0        |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 0        |
----------------------------------
--2023-11-09 05:17:54.577854 CST--
| Itration            | 1        |
| Real Det Return     | 1.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | 50.6     |
| Running Env Steps   | 5000     |
| Running Forward KL  | 16       |
| Running Reverse KL  | 14       |
| Running Update Time | 1        |
----------------------------------
--2023-11-09 05:19:19.110797 CST--
| Itration            | 2        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | 31.3     |
| Running Env Steps   | 10000    |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 14.4     |
| Running Update Time | 2        |
----------------------------------
--2023-11-09 05:20:44.351790 CST--
| Itration            | 3        |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.8e+03  |
| Real Sto violation  | 0        |
| Reward Loss         | 25.2     |
| Running Env Steps   | 15000    |
| Running Forward KL  | 17.1     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 3        |
----------------------------------
--2023-11-09 05:22:09.228272 CST--
| Itration            | 4        |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | 17.6     |
| Running Env Steps   | 20000    |
| Running Forward KL  | 16.6     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 4        |
----------------------------------
--2023-11-09 05:23:34.236211 CST--
| Itration            | 5        |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -0.844   |
| Running Env Steps   | 25000    |
| Running Forward KL  | 15.9     |
| Running Reverse KL  | 15       |
| Running Update Time | 5        |
----------------------------------
--2023-11-09 05:24:59.436150 CST--
| Itration            | 6        |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -8.46    |
| Running Env Steps   | 30000    |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 6        |
----------------------------------
--2023-11-09 05:26:24.589907 CST--
| Itration            | 7        |
| Real Det Return     | 1.78e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -32.5    |
| Running Env Steps   | 35000    |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 15       |
| Running Update Time | 7        |
----------------------------------
--2023-11-09 05:27:49.794073 CST--
| Itration            | 8        |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -41.5    |
| Running Env Steps   | 40000    |
| Running Forward KL  | 16       |
| Running Reverse KL  | 14.7     |
| Running Update Time | 8        |
----------------------------------
--2023-11-09 05:29:15.253221 CST--
| Itration            | 9        |
| Real Det Return     | 1.77e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.81e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -53      |
| Running Env Steps   | 45000    |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 15       |
| Running Update Time | 9        |
----------------------------------
--2023-11-09 05:30:41.501057 CST--
| Itration            | 10       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -69.7    |
| Running Env Steps   | 50000    |
| Running Forward KL  | 15       |
| Running Reverse KL  | 14.3     |
| Running Update Time | 10       |
----------------------------------
--2023-11-09 05:32:09.384508 CST--
| Itration            | 11       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -83.1    |
| Running Env Steps   | 55000    |
| Running Forward KL  | 15       |
| Running Reverse KL  | 13.7     |
| Running Update Time | 11       |
----------------------------------
--2023-11-09 05:33:38.264267 CST--
| Itration            | 12       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -99.3    |
| Running Env Steps   | 60000    |
| Running Forward KL  | 15.8     |
| Running Reverse KL  | 14.2     |
| Running Update Time | 12       |
----------------------------------
--2023-11-09 05:35:07.812470 CST--
| Itration            | 13       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -108     |
| Running Env Steps   | 65000    |
| Running Forward KL  | 14.7     |
| Running Reverse KL  | 13.8     |
| Running Update Time | 13       |
----------------------------------
--2023-11-09 05:36:40.724195 CST--
| Itration            | 14       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.83e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -122     |
| Running Env Steps   | 70000    |
| Running Forward KL  | 14.8     |
| Running Reverse KL  | 13.7     |
| Running Update Time | 14       |
----------------------------------
--2023-11-09 05:38:17.647051 CST--
| Itration            | 15       |
| Real Det Return     | 1.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.82e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -137     |
| Running Env Steps   | 75000    |
| Running Forward KL  | 14.8     |
| Running Reverse KL  | 13.6     |
| Running Update Time | 15       |
----------------------------------
