Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_09_00_55_10
--2023-11-09 00:56:24.885838 CST---
| Itration            | 0         |
| Real Det Return     | -1.27e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -142      |
| Real Sto violation  | 1         |
| Reward Loss         | 707       |
| Running Env Steps   | 0         |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 0         |
-----------------------------------
--2023-11-09 00:57:53.571670 CST--
| Itration            | 1        |
| Real Det Return     | -1.6e+03 |
| Real Det violation  | 0.3      |
| Real Sto Return     | -314     |
| Real Sto violation  | 1        |
| Reward Loss         | 870      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 1        |
----------------------------------
--2023-11-09 00:59:22.392983 CST---
| Itration            | 2         |
| Real Det Return     | -1.74e+03 |
| Real Det violation  | 0.15      |
| Real Sto Return     | -461      |
| Real Sto violation  | 1         |
| Reward Loss         | 857       |
| Running Env Steps   | 10000     |
| Running Forward KL  | 19.3      |
| Running Reverse KL  | 12.6      |
| Running Update Time | 2         |
-----------------------------------
--2023-11-09 01:00:49.751092 CST---
| Itration            | 3         |
| Real Det Return     | -1.51e+03 |
| Real Det violation  | 0.05      |
| Real Sto Return     | -349      |
| Real Sto violation  | 1         |
| Reward Loss         | 802       |
| Running Env Steps   | 15000     |
| Running Forward KL  | 19.1      |
| Running Reverse KL  | 12.5      |
| Running Update Time | 3         |
-----------------------------------
--2023-11-09 01:02:17.557586 CST---
| Itration            | 4         |
| Real Det Return     | -1.69e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -388      |
| Real Sto violation  | 1         |
| Reward Loss         | 723       |
| Running Env Steps   | 20000     |
| Running Forward KL  | 18.7      |
| Running Reverse KL  | 12        |
| Running Update Time | 4         |
-----------------------------------
--2023-11-09 01:03:44.128045 CST---
| Itration            | 5         |
| Real Det Return     | -1.79e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -378      |
| Real Sto violation  | 1         |
| Reward Loss         | 633       |
| Running Env Steps   | 25000     |
| Running Forward KL  | 18.2      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 5         |
-----------------------------------
--2023-11-09 01:05:12.002893 CST---
| Itration            | 6         |
| Real Det Return     | -1.64e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -376      |
| Real Sto violation  | 0.9       |
| Reward Loss         | 627       |
| Running Env Steps   | 30000     |
| Running Forward KL  | 18.4      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 6         |
-----------------------------------
--2023-11-09 01:06:39.806214 CST---
| Itration            | 7         |
| Real Det Return     | -1.53e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -372      |
| Real Sto violation  | 1         |
| Reward Loss         | 582       |
| Running Env Steps   | 35000     |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 11        |
| Running Update Time | 7         |
-----------------------------------
--2023-11-09 01:08:08.153028 CST---
| Itration            | 8         |
| Real Det Return     | -1.58e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -417      |
| Real Sto violation  | 1         |
| Reward Loss         | 564       |
| Running Env Steps   | 40000     |
| Running Forward KL  | 18.4      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 8         |
-----------------------------------
--2023-11-09 01:09:36.841707 CST---
| Itration            | 9         |
| Real Det Return     | -1.45e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -469      |
| Real Sto violation  | 1         |
| Reward Loss         | 519       |
| Running Env Steps   | 45000     |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 9         |
-----------------------------------
--2023-11-09 01:11:06.902850 CST---
| Itration            | 10        |
| Real Det Return     | -1.73e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -488      |
| Real Sto violation  | 1         |
| Reward Loss         | 541       |
| Running Env Steps   | 50000     |
| Running Forward KL  | 18.3      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 10        |
-----------------------------------
--2023-11-09 01:12:37.708508 CST---
| Itration            | 11        |
| Real Det Return     | -1.56e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -455      |
| Real Sto violation  | 1         |
| Reward Loss         | 492       |
| Running Env Steps   | 55000     |
| Running Forward KL  | 18        |
| Running Reverse KL  | 10.4      |
| Running Update Time | 11        |
-----------------------------------
--2023-11-09 01:14:12.974136 CST---
| Itration            | 12        |
| Real Det Return     | -1.77e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -471      |
| Real Sto violation  | 1         |
| Reward Loss         | 491       |
| Running Env Steps   | 60000     |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 12        |
-----------------------------------
--2023-11-09 01:15:48.311304 CST--
| Itration            | 13       |
| Real Det Return     | -1.6e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -437     |
| Real Sto violation  | 1        |
| Reward Loss         | 450      |
| Running Env Steps   | 65000    |
| Running Forward KL  | 17.6     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 13       |
----------------------------------
--2023-11-09 01:17:26.769383 CST--
| Itration            | 14       |
| Real Det Return     | -1.6e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -453     |
| Real Sto violation  | 0.95     |
| Reward Loss         | 419      |
| Running Env Steps   | 70000    |
| Running Forward KL  | 18       |
| Running Reverse KL  | 10.1     |
| Running Update Time | 14       |
----------------------------------
--2023-11-09 01:19:10.724036 CST---
| Itration            | 15        |
| Real Det Return     | -1.68e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -471      |
| Real Sto violation  | 1         |
| Reward Loss         | 408       |
| Running Env Steps   | 75000     |
| Running Forward KL  | 18        |
| Running Reverse KL  | 9.78      |
| Running Update Time | 15        |
-----------------------------------
--2023-11-09 01:20:53.393596 CST---
| Itration            | 16        |
| Real Det Return     | -1.58e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -339      |
| Real Sto violation  | 1         |
| Reward Loss         | 395       |
| Running Env Steps   | 80000     |
| Running Forward KL  | 17.5      |
| Running Reverse KL  | 9.66      |
| Running Update Time | 16        |
-----------------------------------
--2023-11-09 01:22:36.989128 CST--
| Itration            | 17       |
| Real Det Return     | -1.2e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -319     |
| Real Sto violation  | 1        |
| Reward Loss         | 355      |
| Running Env Steps   | 85000    |
| Running Forward KL  | 17.5     |
| Running Reverse KL  | 9.69     |
| Running Update Time | 17       |
----------------------------------
--2023-11-09 01:24:26.035687 CST---
| Itration            | 18        |
| Real Det Return     | -1.32e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -416      |
| Real Sto violation  | 1         |
| Reward Loss         | 331       |
| Running Env Steps   | 90000     |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 9.46      |
| Running Update Time | 18        |
-----------------------------------
--2023-11-09 01:26:15.697484 CST--
| Itration            | 19       |
| Real Det Return     | -1.5e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | -383     |
| Real Sto violation  | 1        |
| Reward Loss         | 309      |
| Running Env Steps   | 95000    |
| Running Forward KL  | 17.1     |
| Running Reverse KL  | 9.5      |
| Running Update Time | 19       |
----------------------------------
--2023-11-09 01:28:06.070366 CST---
| Itration            | 20        |
| Real Det Return     | -1.59e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -428      |
| Real Sto violation  | 1         |
| Reward Loss         | 307       |
| Running Env Steps   | 100000    |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 9.41      |
| Running Update Time | 20        |
-----------------------------------
--2023-11-09 01:29:57.953201 CST---
| Itration            | 21        |
| Real Det Return     | -1.48e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -431      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 281       |
| Running Env Steps   | 105000    |
| Running Forward KL  | 17.4      |
| Running Reverse KL  | 9.37      |
| Running Update Time | 21        |
-----------------------------------
--2023-11-09 01:31:50.832589 CST---
| Itration            | 22        |
| Real Det Return     | -1.37e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -404      |
| Real Sto violation  | 1         |
| Reward Loss         | 278       |
| Running Env Steps   | 110000    |
| Running Forward KL  | 17.6      |
| Running Reverse KL  | 9.27      |
| Running Update Time | 22        |
-----------------------------------
--2023-11-09 01:33:43.813860 CST---
| Itration            | 23        |
| Real Det Return     | -1.44e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -291      |
| Real Sto violation  | 1         |
| Reward Loss         | 254       |
| Running Env Steps   | 115000    |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 8.73      |
| Running Update Time | 23        |
-----------------------------------
--2023-11-09 01:35:37.779538 CST---
| Itration            | 24        |
| Real Det Return     | -1.66e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -404      |
| Real Sto violation  | 1         |
| Reward Loss         | 249       |
| Running Env Steps   | 120000    |
| Running Forward KL  | 17.7      |
| Running Reverse KL  | 9.2       |
| Running Update Time | 24        |
-----------------------------------
--2023-11-09 01:37:32.923767 CST---
| Itration            | 25        |
| Real Det Return     | -1.41e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -407      |
| Real Sto violation  | 1         |
| Reward Loss         | 236       |
| Running Env Steps   | 125000    |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 8.99      |
| Running Update Time | 25        |
-----------------------------------
--2023-11-09 01:39:30.420266 CST---
| Itration            | 26        |
| Real Det Return     | -1.29e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -388      |
| Real Sto violation  | 1         |
| Reward Loss         | 224       |
| Running Env Steps   | 130000    |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 9.09      |
| Running Update Time | 26        |
-----------------------------------
--2023-11-09 01:41:28.166057 CST---
| Itration            | 27        |
| Real Det Return     | -1.24e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -302      |
| Real Sto violation  | 1         |
| Reward Loss         | 197       |
| Running Env Steps   | 135000    |
| Running Forward KL  | 17        |
| Running Reverse KL  | 8.72      |
| Running Update Time | 27        |
-----------------------------------
--2023-11-09 01:43:26.640229 CST---
| Itration            | 28        |
| Real Det Return     | -1.46e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -326      |
| Real Sto violation  | 1         |
| Reward Loss         | 194       |
| Running Env Steps   | 140000    |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 8.55      |
| Running Update Time | 28        |
-----------------------------------
--2023-11-09 01:45:25.595982 CST---
| Itration            | 29        |
| Real Det Return     | -1.22e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -304      |
| Real Sto violation  | 1         |
| Reward Loss         | 167       |
| Running Env Steps   | 145000    |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 8.15      |
| Running Update Time | 29        |
-----------------------------------
--2023-11-09 01:47:20.224008 CST---
| Itration            | 30        |
| Real Det Return     | -1.08e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -338      |
| Real Sto violation  | 1         |
| Reward Loss         | 178       |
| Running Env Steps   | 150000    |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 8.59      |
| Running Update Time | 30        |
-----------------------------------
--2023-11-09 01:49:07.089026 CST---
| Itration            | 31        |
| Real Det Return     | -1.26e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -276      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 149       |
| Running Env Steps   | 155000    |
| Running Forward KL  | 17        |
| Running Reverse KL  | 8.56      |
| Running Update Time | 31        |
-----------------------------------
--2023-11-09 01:51:07.223427 CST---
| Itration            | 32        |
| Real Det Return     | -1.26e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -348      |
| Real Sto violation  | 1         |
| Reward Loss         | 147       |
| Running Env Steps   | 160000    |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 8.55      |
| Running Update Time | 32        |
-----------------------------------
--2023-11-09 01:53:09.312632 CST---
| Itration            | 33        |
| Real Det Return     | -1.35e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -231      |
| Real Sto violation  | 1         |
| Reward Loss         | 144       |
| Running Env Steps   | 165000    |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 8.35      |
| Running Update Time | 33        |
-----------------------------------
--2023-11-09 01:55:11.089443 CST---
| Itration            | 34        |
| Real Det Return     | -1.12e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -294      |
| Real Sto violation  | 1         |
| Reward Loss         | 125       |
| Running Env Steps   | 170000    |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 8.39      |
| Running Update Time | 34        |
-----------------------------------
--2023-11-09 01:57:11.861577 CST---
| Itration            | 35        |
| Real Det Return     | -1.36e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -283      |
| Real Sto violation  | 1         |
| Reward Loss         | 124       |
| Running Env Steps   | 175000    |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 8.34      |
| Running Update Time | 35        |
-----------------------------------
--2023-11-09 01:59:13.202624 CST---
| Itration            | 36        |
| Real Det Return     | -1.32e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -343      |
| Real Sto violation  | 0.95      |
| Reward Loss         | 115       |
| Running Env Steps   | 180000    |
| Running Forward KL  | 16.4      |
| Running Reverse KL  | 8.08      |
| Running Update Time | 36        |
-----------------------------------
--2023-11-09 02:01:13.705759 CST---
| Itration            | 37        |
| Real Det Return     | -1.25e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -315      |
| Real Sto violation  | 1         |
| Reward Loss         | 116       |
| Running Env Steps   | 185000    |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 8.31      |
| Running Update Time | 37        |
-----------------------------------
--2023-11-09 02:03:14.539375 CST---
| Itration            | 38        |
| Real Det Return     | -1.25e+03 |
| Real Det violation  | 0         |
| Real Sto Return     | -341      |
| Real Sto violation  | 1         |
| Reward Loss         | 109       |
| Running Env Steps   | 190000    |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 8.21      |
| Running Update Time | 38        |
-----------------------------------
