Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_06_10_01_32
--2023-11-06 10:02:52.835692 CST--
| Itration            | 0        |
| Real Det Return     | 124      |
| Real Sto Return     | -325     |
| Reward Loss         | 150      |
| Running Env Steps   | 0        |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 0        |
----------------------------------
--2023-11-06 10:04:23.484962 CST--
| Itration            | 1        |
| Real Det Return     | 74.5     |
| Real Sto Return     | -389     |
| Reward Loss         | 151      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 19.3     |
| Running Reverse KL  | 11.9     |
| Running Update Time | 1        |
----------------------------------
--2023-11-06 10:05:51.242169 CST--
| Itration            | 2        |
| Real Det Return     | 138      |
| Real Sto Return     | -370     |
| Reward Loss         | 172      |
| Running Env Steps   | 10000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 2        |
----------------------------------
--2023-11-06 10:07:19.291651 CST--
| Itration            | 3        |
| Real Det Return     | 237      |
| Real Sto Return     | -297     |
| Reward Loss         | 111      |
| Running Env Steps   | 15000    |
| Running Forward KL  | 19.7     |
| Running Reverse KL  | 12.4     |
| Running Update Time | 3        |
----------------------------------
--2023-11-06 10:08:48.555525 CST--
| Itration            | 4        |
| Real Det Return     | -33.4    |
| Real Sto Return     | -352     |
| Reward Loss         | 94.3     |
| Running Env Steps   | 20000    |
| Running Forward KL  | 20       |
| Running Reverse KL  | 12.9     |
| Running Update Time | 4        |
----------------------------------
--2023-11-06 10:10:20.082131 CST--
| Itration            | 5        |
| Real Det Return     | 88.8     |
| Real Sto Return     | -315     |
| Reward Loss         | 104      |
| Running Env Steps   | 25000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 5        |
----------------------------------
--2023-11-06 10:11:51.869666 CST--
| Itration            | 6        |
| Real Det Return     | 188      |
| Real Sto Return     | -258     |
| Reward Loss         | 50       |
| Running Env Steps   | 30000    |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 6        |
----------------------------------
--2023-11-06 10:13:24.125048 CST--
| Itration            | 7        |
| Real Det Return     | 59.2     |
| Real Sto Return     | -283     |
| Reward Loss         | 46.6     |
| Running Env Steps   | 35000    |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 7        |
----------------------------------
--2023-11-06 10:14:56.722503 CST--
| Itration            | 8        |
| Real Det Return     | 122      |
| Real Sto Return     | -287     |
| Reward Loss         | 29       |
| Running Env Steps   | 40000    |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 13       |
| Running Update Time | 8        |
----------------------------------
--2023-11-06 10:16:29.327034 CST--
| Itration            | 9        |
| Real Det Return     | -157     |
| Real Sto Return     | -233     |
| Reward Loss         | 21.6     |
| Running Env Steps   | 45000    |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 9        |
----------------------------------
--2023-11-06 10:17:55.386920 CST--
| Itration            | 10       |
| Real Det Return     | 284      |
| Real Sto Return     | -278     |
| Reward Loss         | -24.9    |
| Running Env Steps   | 50000    |
| Running Forward KL  | 19.9     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 10       |
----------------------------------
--2023-11-06 10:19:31.370337 CST--
| Itration            | 11       |
| Real Det Return     | 222      |
| Real Sto Return     | -227     |
| Reward Loss         | -27.7    |
| Running Env Steps   | 55000    |
| Running Forward KL  | 19.8     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 11       |
----------------------------------
--2023-11-06 10:21:08.078896 CST--
| Itration            | 12       |
| Real Det Return     | 632      |
| Real Sto Return     | -237     |
| Reward Loss         | -65      |
| Running Env Steps   | 60000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 12       |
----------------------------------
--2023-11-06 10:22:46.614445 CST--
| Itration            | 13       |
| Real Det Return     | 182      |
| Real Sto Return     | -251     |
| Reward Loss         | -76.1    |
| Running Env Steps   | 65000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 13       |
----------------------------------
--2023-11-06 10:24:29.664158 CST--
| Itration            | 14       |
| Real Det Return     | 437      |
| Real Sto Return     | -219     |
| Reward Loss         | -87.3    |
| Running Env Steps   | 70000    |
| Running Forward KL  | 19.7     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 14       |
----------------------------------
--2023-11-06 10:26:18.084482 CST--
| Itration            | 15       |
| Real Det Return     | 504      |
| Real Sto Return     | -204     |
| Reward Loss         | -109     |
| Running Env Steps   | 75000    |
| Running Forward KL  | 19.4     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 15       |
----------------------------------
--2023-11-06 10:28:07.524045 CST--
| Itration            | 16       |
| Real Det Return     | 537      |
| Real Sto Return     | -225     |
| Reward Loss         | -141     |
| Running Env Steps   | 80000    |
| Running Forward KL  | 19.7     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 16       |
----------------------------------
--2023-11-06 10:29:58.221046 CST--
| Itration            | 17       |
| Real Det Return     | 750      |
| Real Sto Return     | -204     |
| Reward Loss         | -157     |
| Running Env Steps   | 85000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.3     |
| Running Update Time | 17       |
----------------------------------
--2023-11-06 10:31:50.113197 CST--
| Itration            | 18       |
| Real Det Return     | 708      |
| Real Sto Return     | -185     |
| Reward Loss         | -170     |
| Running Env Steps   | 90000    |
| Running Forward KL  | 19.2     |
| Running Reverse KL  | 12       |
| Running Update Time | 18       |
----------------------------------
--2023-11-06 10:33:43.335651 CST--
| Itration            | 19       |
| Real Det Return     | 716      |
| Real Sto Return     | -213     |
| Reward Loss         | -221     |
| Running Env Steps   | 95000    |
| Running Forward KL  | 19.6     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 19       |
----------------------------------
--2023-11-06 10:35:37.609732 CST--
| Itration            | 20       |
| Real Det Return     | 844      |
| Real Sto Return     | -154     |
| Reward Loss         | -208     |
| Running Env Steps   | 100000   |
| Running Forward KL  | 19.2     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 20       |
----------------------------------
--2023-11-06 10:37:33.787721 CST--
| Itration            | 21       |
| Real Det Return     | 646      |
| Real Sto Return     | -164     |
| Reward Loss         | -233     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 19.4     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 21       |
----------------------------------
