Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_09_00_10_19
--2023-11-09 00:11:39.097353 CST---
| Itration            | 0         |
| Real Det Return     | -1.24e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -134      |
| Real Sto violation  | 1         |
| Reward Loss         | 643       |
| Running Env Steps   | 0         |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 0         |
-----------------------------------
--2023-11-09 00:13:07.790606 CST---
| Itration            | 1         |
| Real Det Return     | -1.24e+03 |
| Real Det violation  | 0.6       |
| Real Sto Return     | -201      |
| Real Sto violation  | 1         |
| Reward Loss         | 743       |
| Running Env Steps   | 5000      |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 1         |
-----------------------------------
--2023-11-09 00:14:36.448139 CST---
| Itration            | 2         |
| Real Det Return     | -1.48e+03 |
| Real Det violation  | 0.65      |
| Real Sto Return     | -326      |
| Real Sto violation  | 1         |
| Reward Loss         | 759       |
| Running Env Steps   | 10000     |
| Running Forward KL  | 18.6      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 2         |
-----------------------------------
--2023-11-09 00:16:04.826150 CST---
| Itration            | 3         |
| Real Det Return     | -1.31e+03 |
| Real Det violation  | 0.35      |
| Real Sto Return     | -291      |
| Real Sto violation  | 1         |
| Reward Loss         | 814       |
| Running Env Steps   | 15000     |
| Running Forward KL  | 18.8      |
| Running Reverse KL  | 12.4      |
| Running Update Time | 3         |
-----------------------------------
--2023-11-09 00:17:33.439915 CST---
| Itration            | 4         |
| Real Det Return     | -1.71e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -321      |
| Real Sto violation  | 1         |
| Reward Loss         | 693       |
| Running Env Steps   | 20000     |
| Running Forward KL  | 18.5      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 4         |
-----------------------------------
--2023-11-09 00:19:02.105133 CST--
| Itration            | 5        |
| Real Det Return     | -1.6e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -347     |
| Real Sto violation  | 1        |
| Reward Loss         | 674      |
| Running Env Steps   | 25000    |
| Running Forward KL  | 18.1     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 5        |
----------------------------------
--2023-11-09 00:20:29.176718 CST---
| Itration            | 6         |
| Real Det Return     | -1.57e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -351      |
| Real Sto violation  | 1         |
| Reward Loss         | 628       |
| Running Env Steps   | 30000     |
| Running Forward KL  | 18        |
| Running Reverse KL  | 11.2      |
| Running Update Time | 6         |
-----------------------------------
--2023-11-09 00:21:56.124416 CST---
| Itration            | 7         |
| Real Det Return     | -1.75e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -371      |
| Real Sto violation  | 1         |
| Reward Loss         | 616       |
| Running Env Steps   | 35000     |
| Running Forward KL  | 18.6      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 7         |
-----------------------------------
--2023-11-09 00:23:23.563027 CST---
| Itration            | 8         |
| Real Det Return     | -1.78e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -405      |
| Real Sto violation  | 1         |
| Reward Loss         | 566       |
| Running Env Steps   | 40000     |
| Running Forward KL  | 18.3      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 8         |
-----------------------------------
--2023-11-09 00:24:59.909872 CST---
| Itration            | 9         |
| Real Det Return     | -1.78e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -348      |
| Real Sto violation  | 1         |
| Reward Loss         | 547       |
| Running Env Steps   | 45000     |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 9         |
-----------------------------------
--2023-11-09 00:26:37.175001 CST---
| Itration            | 10        |
| Real Det Return     | -1.58e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -343      |
| Real Sto violation  | 1         |
| Reward Loss         | 524       |
| Running Env Steps   | 50000     |
| Running Forward KL  | 18        |
| Running Reverse KL  | 10.4      |
| Running Update Time | 10        |
-----------------------------------
--2023-11-09 00:28:07.790463 CST---
| Itration            | 11        |
| Real Det Return     | -1.61e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -402      |
| Real Sto violation  | 1         |
| Reward Loss         | 509       |
| Running Env Steps   | 55000     |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 11        |
-----------------------------------
--2023-11-09 00:29:40.041897 CST---
| Itration            | 12        |
| Real Det Return     | -1.62e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -430      |
| Real Sto violation  | 1         |
| Reward Loss         | 479       |
| Running Env Steps   | 60000     |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 12        |
-----------------------------------
--2023-11-09 00:31:14.255699 CST---
| Itration            | 13        |
| Real Det Return     | -1.49e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -362      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 430       |
| Running Env Steps   | 65000     |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 9.78      |
| Running Update Time | 13        |
-----------------------------------
--2023-11-09 00:32:53.055038 CST---
| Itration            | 14        |
| Real Det Return     | -1.64e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -422      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 432       |
| Running Env Steps   | 70000     |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 9.94      |
| Running Update Time | 14        |
-----------------------------------
--2023-11-09 00:34:36.685034 CST---
| Itration            | 15        |
| Real Det Return     | -1.64e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -482      |
| Real Sto violation  | 1         |
| Reward Loss         | 404       |
| Running Env Steps   | 75000     |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 9.93      |
| Running Update Time | 15        |
-----------------------------------
--2023-11-09 00:36:23.399323 CST--
| Itration            | 16       |
| Real Det Return     | -1.7e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -342     |
| Real Sto violation  | 1        |
| Reward Loss         | 391      |
| Running Env Steps   | 80000    |
| Running Forward KL  | 18       |
| Running Reverse KL  | 9.73     |
| Running Update Time | 16       |
----------------------------------
--2023-11-09 00:38:10.939733 CST---
| Itration            | 17        |
| Real Det Return     | -1.53e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -393      |
| Real Sto violation  | 1         |
| Reward Loss         | 373       |
| Running Env Steps   | 85000     |
| Running Forward KL  | 17.5      |
| Running Reverse KL  | 9.64      |
| Running Update Time | 17        |
-----------------------------------
