Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_08_11_52_41
--2023-11-08 11:54:05.902416 CST--
| Cost Loss           | 50.6     |
| Itration            | 0        |
| Real Det Return     | -115     |
| Real Det violation  | 0.9      |
| Real Sto Return     | 0.43     |
| Real Sto violation  | 1        |
| Reward Loss         | 563      |
| Running Env Steps   | 0        |
| Running Forward KL  | 17.7     |
| Running Reverse KL  | 9.22     |
| Running Update Time | 0        |
----------------------------------
--2023-11-08 11:55:40.524897 CST--
| Cost Loss           | 36.5     |
| Itration            | 1        |
| Real Det Return     | -281     |
| Real Det violation  | 0.15     |
| Real Sto Return     | 9.8      |
| Real Sto violation  | 1        |
| Reward Loss         | 587      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 17.8     |
| Running Reverse KL  | 9.91     |
| Running Update Time | 1        |
----------------------------------
--2023-11-08 11:57:14.755258 CST---
| Cost Loss           | 59.9      |
| Itration            | 2         |
| Real Det Return     | -1.01e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -30.6     |
| Real Sto violation  | 1         |
| Reward Loss         | 569       |
| Running Env Steps   | 10000     |
| Running Forward KL  | 17.8      |
| Running Reverse KL  | 9.25      |
| Running Update Time | 2         |
-----------------------------------
--2023-11-08 11:58:49.161102 CST--
| Cost Loss           | 45.4     |
| Itration            | 3        |
| Real Det Return     | -690     |
| Real Det violation  | 0        |
| Real Sto Return     | -84.5    |
| Real Sto violation  | 1        |
| Reward Loss         | 612      |
| Running Env Steps   | 15000    |
| Running Forward KL  | 17.5     |
| Running Reverse KL  | 9.83     |
| Running Update Time | 3        |
----------------------------------
--2023-11-08 12:00:23.302314 CST--
| Cost Loss           | 9.86     |
| Itration            | 4        |
| Real Det Return     | -1.1e+03 |
| Real Det violation  | 0.1      |
| Real Sto Return     | -159     |
| Real Sto violation  | 1        |
| Reward Loss         | 597      |
| Running Env Steps   | 20000    |
| Running Forward KL  | 17.2     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 4        |
----------------------------------
--2023-11-08 12:01:57.536788 CST--
| Cost Loss           | 12.1     |
| Itration            | 5        |
| Real Det Return     | -632     |
| Real Det violation  | 0.7      |
| Real Sto Return     | -113     |
| Real Sto violation  | 1        |
| Reward Loss         | 574      |
| Running Env Steps   | 25000    |
| Running Forward KL  | 17.6     |
| Running Reverse KL  | 9.65     |
| Running Update Time | 5        |
----------------------------------
--2023-11-08 12:03:31.995146 CST--
| Cost Loss           | 8.36     |
| Itration            | 6        |
| Real Det Return     | -940     |
| Real Det violation  | 0.95     |
| Real Sto Return     | -123     |
| Real Sto violation  | 1        |
| Reward Loss         | 554      |
| Running Env Steps   | 30000    |
| Running Forward KL  | 17.5     |
| Running Reverse KL  | 9.67     |
| Running Update Time | 6        |
----------------------------------
--2023-11-08 12:05:05.014777 CST---
| Cost Loss           | 5.15      |
| Itration            | 7         |
| Real Det Return     | -1.09e+03 |
| Real Det violation  | 0.95      |
| Real Sto Return     | -194      |
| Real Sto violation  | 1         |
| Reward Loss         | 522       |
| Running Env Steps   | 35000     |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 9.39      |
| Running Update Time | 7         |
-----------------------------------
--2023-11-08 12:06:35.161642 CST---
| Cost Loss           | 2.58      |
| Itration            | 8         |
| Real Det Return     | -1.38e+03 |
| Real Det violation  | 0.45      |
| Real Sto Return     | -244      |
| Real Sto violation  | 1         |
| Reward Loss         | 502       |
| Running Env Steps   | 40000     |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 8.98      |
| Running Update Time | 8         |
-----------------------------------
--2023-11-08 12:08:05.237904 CST---
| Cost Loss           | -13.7     |
| Itration            | 9         |
| Real Det Return     | -1.38e+03 |
| Real Det violation  | 0.4       |
| Real Sto Return     | -203      |
| Real Sto violation  | 1         |
| Reward Loss         | 484       |
| Running Env Steps   | 45000     |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 9.2       |
| Running Update Time | 9         |
-----------------------------------
--2023-11-08 12:09:36.270408 CST---
| Cost Loss           | -18       |
| Itration            | 10        |
| Real Det Return     | -1.59e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -242      |
| Real Sto violation  | 1         |
| Reward Loss         | 454       |
| Running Env Steps   | 50000     |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 9.12      |
| Running Update Time | 10        |
-----------------------------------
--2023-11-08 12:11:08.954880 CST---
| Cost Loss           | -17.9     |
| Itration            | 11        |
| Real Det Return     | -1.33e+03 |
| Real Det violation  | 0.05      |
| Real Sto Return     | -173      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 451       |
| Running Env Steps   | 55000     |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 9.11      |
| Running Update Time | 11        |
-----------------------------------
