Logging to logs/Walker2d-v3/exp-1/maxentirl_sa/2023_11_10_22_33_40
--2023-11-10 22:34:50.187459 CST--
| Itration            | 0        |
| Real Det Return     | 96.7     |
| Real Det violation  | 0.05     |
| Real Sto Return     | 145      |
| Real Sto violation  | 0.3      |
| Reward Loss         | 163      |
| Running Env Steps   | 0        |
| Running Forward KL  | 29.3     |
| Running Reverse KL  | 16.3     |
| Running Update Time | 0        |
----------------------------------
--2023-11-10 22:36:11.881928 CST--
| Itration            | 1        |
| Real Det Return     | 114      |
| Real Det violation  | 0        |
| Real Sto Return     | 205      |
| Real Sto violation  | 0.4      |
| Reward Loss         | 138      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 1        |
----------------------------------
--2023-11-10 22:37:33.178182 CST--
| Itration            | 2        |
| Real Det Return     | 126      |
| Real Det violation  | 0        |
| Real Sto Return     | 165      |
| Real Sto violation  | 0.45     |
| Reward Loss         | 176      |
| Running Env Steps   | 10000    |
| Running Forward KL  | 28.3     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 2        |
----------------------------------
--2023-11-10 22:38:55.651392 CST--
| Itration            | 3        |
| Real Det Return     | 337      |
| Real Det violation  | 1        |
| Real Sto Return     | 276      |
| Real Sto violation  | 0.6      |
| Reward Loss         | 157      |
| Running Env Steps   | 15000    |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 14.6     |
| Running Update Time | 3        |
----------------------------------
--2023-11-10 22:40:19.781677 CST--
| Itration            | 4        |
| Real Det Return     | 459      |
| Real Det violation  | 1        |
| Real Sto Return     | 342      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 152      |
| Running Env Steps   | 20000    |
| Running Forward KL  | 28.2     |
| Running Reverse KL  | 15.6     |
| Running Update Time | 4        |
----------------------------------
--2023-11-10 22:41:41.886329 CST--
| Itration            | 5        |
| Real Det Return     | 477      |
| Real Det violation  | 0.95     |
| Real Sto Return     | 313      |
| Real Sto violation  | 0.8      |
| Reward Loss         | 102      |
| Running Env Steps   | 25000    |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 5        |
----------------------------------
--2023-11-10 22:43:08.968799 CST--
| Itration            | 6        |
| Real Det Return     | 357      |
| Real Det violation  | 1        |
| Real Sto Return     | 395      |
| Real Sto violation  | 0.85     |
| Reward Loss         | 103      |
| Running Env Steps   | 30000    |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 13.1     |
| Running Update Time | 6        |
----------------------------------
--2023-11-10 22:44:38.786338 CST--
| Itration            | 7        |
| Real Det Return     | 763      |
| Real Det violation  | 0.9      |
| Real Sto Return     | 300      |
| Real Sto violation  | 0.65     |
| Reward Loss         | 126      |
| Running Env Steps   | 35000    |
| Running Forward KL  | 28.3     |
| Running Reverse KL  | 16.2     |
| Running Update Time | 7        |
----------------------------------
--2023-11-10 22:46:06.869360 CST--
| Itration            | 8        |
| Real Det Return     | 223      |
| Real Det violation  | 1        |
| Real Sto Return     | 439      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 52.3     |
| Running Env Steps   | 40000    |
| Running Forward KL  | 28.2     |
| Running Reverse KL  | 22       |
| Running Update Time | 8        |
----------------------------------
--2023-11-10 22:47:39.464585 CST--
| Itration            | 9        |
| Real Det Return     | 747      |
| Real Det violation  | 1        |
| Real Sto Return     | 682      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 85.9     |
| Running Env Steps   | 45000    |
| Running Forward KL  | 28       |
| Running Reverse KL  | 17.7     |
| Running Update Time | 9        |
----------------------------------
--2023-11-10 22:49:14.821109 CST--
| Itration            | 10       |
| Real Det Return     | 991      |
| Real Det violation  | 0.95     |
| Real Sto Return     | 795      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 56.7     |
| Running Env Steps   | 50000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 15.7     |
| Running Update Time | 10       |
----------------------------------
--2023-11-10 22:50:49.355963 CST--
| Itration            | 11       |
| Real Det Return     | 639      |
| Real Det violation  | 1        |
| Real Sto Return     | 796      |
| Real Sto violation  | 0.95     |
| Reward Loss         | 79.7     |
| Running Env Steps   | 55000    |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 14.8     |
| Running Update Time | 11       |
----------------------------------
--2023-11-10 22:52:38.292641 CST--
| Itration            | 12       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 870      |
| Real Sto violation  | 0.75     |
| Reward Loss         | 68.1     |
| Running Env Steps   | 60000    |
| Running Forward KL  | 27.9     |
| Running Reverse KL  | 16.3     |
| Running Update Time | 12       |
----------------------------------
--2023-11-10 22:54:26.368347 CST--
| Itration            | 13       |
| Real Det Return     | 2.52e+03 |
| Real Det violation  | 0.1      |
| Real Sto Return     | 764      |
| Real Sto violation  | 1        |
| Reward Loss         | 17.5     |
| Running Env Steps   | 65000    |
| Running Forward KL  | 28.6     |
| Running Reverse KL  | 41.6     |
| Running Update Time | 13       |
----------------------------------
--2023-11-10 22:56:16.556178 CST--
| Itration            | 14       |
| Real Det Return     | 2.44e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 765      |
| Real Sto violation  | 0.7      |
| Reward Loss         | 30.8     |
| Running Env Steps   | 70000    |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 28       |
| Running Update Time | 14       |
----------------------------------
--2023-11-10 22:58:12.750810 CST--
| Itration            | 15       |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.12e+03 |
| Real Sto violation  | 0.95     |
| Reward Loss         | 65.9     |
| Running Env Steps   | 75000    |
| Running Forward KL  | 26.4     |
| Running Reverse KL  | 13.6     |
| Running Update Time | 15       |
----------------------------------
--2023-11-10 22:59:58.565160 CST--
| Itration            | 16       |
| Real Det Return     | 624      |
| Real Det violation  | 1        |
| Real Sto Return     | 1.14e+03 |
| Real Sto violation  | 0.85     |
| Reward Loss         | 53.5     |
| Running Env Steps   | 80000    |
| Running Forward KL  | 27       |
| Running Reverse KL  | 14.3     |
| Running Update Time | 16       |
----------------------------------
--2023-11-10 23:01:48.019522 CST--
| Itration            | 17       |
| Real Det Return     | 1.01e+03 |
| Real Det violation  | 0.75     |
| Real Sto Return     | 975      |
| Real Sto violation  | 0.55     |
| Reward Loss         | -24.4    |
| Running Env Steps   | 85000    |
| Running Forward KL  | 28.4     |
| Running Reverse KL  | 53       |
| Running Update Time | 17       |
----------------------------------
--2023-11-10 23:03:46.881225 CST--
| Itration            | 18       |
| Real Det Return     | 2.48e+03 |
| Real Det violation  | 0.1      |
| Real Sto Return     | 1.13e+03 |
| Real Sto violation  | 0.65     |
| Reward Loss         | 45       |
| Running Env Steps   | 90000    |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 18       |
----------------------------------
--2023-11-10 23:05:45.528477 CST--
| Itration            | 19       |
| Real Det Return     | 2.01e+03 |
| Real Det violation  | 0.4      |
| Real Sto Return     | 1.28e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | 39.8     |
| Running Env Steps   | 95000    |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 14.3     |
| Running Update Time | 19       |
----------------------------------
--2023-11-10 23:07:46.327725 CST--
| Itration            | 20       |
| Real Det Return     | 2.29e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 1.46e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | 46.1     |
| Running Env Steps   | 100000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 20       |
----------------------------------
--2023-11-10 23:09:45.268468 CST--
| Itration            | 21       |
| Real Det Return     | 2.38e+03 |
| Real Det violation  | 0.15     |
| Real Sto Return     | 1.31e+03 |
| Real Sto violation  | 0.75     |
| Reward Loss         | 33.8     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 14.2     |
| Running Update Time | 21       |
----------------------------------
--2023-11-10 23:11:49.240452 CST--
| Itration            | 22       |
| Real Det Return     | 2.12e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 1.9e+03  |
| Real Sto violation  | 0.25     |
| Reward Loss         | 32.6     |
| Running Env Steps   | 110000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 22       |
----------------------------------
--2023-11-10 23:13:52.721246 CST--
| Itration            | 23       |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0.05     |
| Real Sto Return     | 1.96e+03 |
| Real Sto violation  | 0.25     |
| Reward Loss         | 30.2     |
| Running Env Steps   | 115000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 23       |
----------------------------------
--2023-11-10 23:15:58.208762 CST--
| Itration            | 24       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.96e+03 |
| Real Sto violation  | 0.3      |
| Reward Loss         | 23.2     |
| Running Env Steps   | 120000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 14.6     |
| Running Update Time | 24       |
----------------------------------
--2023-11-10 23:18:01.575138 CST--
| Itration            | 25       |
| Real Det Return     | 2.47e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.8e+03  |
| Real Sto violation  | 0.25     |
| Reward Loss         | 2.84     |
| Running Env Steps   | 125000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 25       |
----------------------------------
--2023-11-10 23:20:07.173641 CST--
| Itration            | 26       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.94e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -13.3    |
| Running Env Steps   | 130000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 14.3     |
| Running Update Time | 26       |
----------------------------------
--2023-11-10 23:22:13.310717 CST--
| Itration            | 27       |
| Real Det Return     | 2.13e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.04e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | 4.46     |
| Running Env Steps   | 135000   |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 27       |
----------------------------------
--2023-11-10 23:24:18.577728 CST--
| Itration            | 28       |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 1.91e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -12.2    |
| Running Env Steps   | 140000   |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 28       |
----------------------------------
--2023-11-10 23:26:25.766485 CST--
| Itration            | 29       |
| Real Det Return     | 2.66e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.08e+03 |
| Real Sto violation  | 0.1      |
| Reward Loss         | -19.6    |
| Running Env Steps   | 145000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15.1     |
| Running Update Time | 29       |
----------------------------------
--2023-11-10 23:28:32.995595 CST--
| Itration            | 30       |
| Real Det Return     | 2.4e+03  |
| Real Det violation  | 0        |
| Real Sto Return     | 2.15e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -8.4     |
| Running Env Steps   | 150000   |
| Running Forward KL  | 27.8     |
| Running Reverse KL  | 15.7     |
| Running Update Time | 30       |
----------------------------------
--2023-11-10 23:30:40.640103 CST--
| Itration            | 31       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.09e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -21      |
| Running Env Steps   | 155000   |
| Running Forward KL  | 28       |
| Running Reverse KL  | 16.3     |
| Running Update Time | 31       |
----------------------------------
--2023-11-10 23:32:47.979599 CST--
| Itration            | 32       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.13e+03 |
| Real Sto violation  | 0.15     |
| Reward Loss         | -34.9    |
| Running Env Steps   | 160000   |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 32       |
----------------------------------
--2023-11-10 23:34:54.272298 CST--
| Itration            | 33       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.02e+03 |
| Real Sto violation  | 0.2      |
| Reward Loss         | -41.4    |
| Running Env Steps   | 165000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 16       |
| Running Update Time | 33       |
----------------------------------
--2023-11-10 23:37:01.137194 CST--
| Itration            | 34       |
| Real Det Return     | 2.35e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -62.3    |
| Running Env Steps   | 170000   |
| Running Forward KL  | 27.3     |
| Running Reverse KL  | 15       |
| Running Update Time | 34       |
----------------------------------
--2023-11-10 23:39:01.111002 CST--
| Itration            | 35       |
| Real Det Return     | 2.39e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.17e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -55.5    |
| Running Env Steps   | 175000   |
| Running Forward KL  | 28.1     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 35       |
----------------------------------
--2023-11-10 23:40:59.787379 CST--
| Itration            | 36       |
| Real Det Return     | 2.46e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.21e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -67      |
| Running Env Steps   | 180000   |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 36       |
----------------------------------
--2023-11-10 23:42:58.111193 CST--
| Itration            | 37       |
| Real Det Return     | 2.69e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.28e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -73.5    |
| Running Env Steps   | 185000   |
| Running Forward KL  | 27.6     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 37       |
----------------------------------
--2023-11-10 23:44:55.937955 CST--
| Itration            | 38       |
| Real Det Return     | 2.43e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.14e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -94.6    |
| Running Env Steps   | 190000   |
| Running Forward KL  | 27.5     |
| Running Reverse KL  | 15.3     |
| Running Update Time | 38       |
----------------------------------
--2023-11-10 23:46:53.568131 CST--
| Itration            | 39       |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.2e+03  |
| Real Sto violation  | 0.05     |
| Reward Loss         | -99.6    |
| Running Env Steps   | 195000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 14.8     |
| Running Update Time | 39       |
----------------------------------
--2023-11-10 23:48:52.227993 CST--
| Itration            | 40       |
| Real Det Return     | 2.67e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.23e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -93.4    |
| Running Env Steps   | 200000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 15.4     |
| Running Update Time | 40       |
----------------------------------
--2023-11-10 23:50:51.635121 CST--
| Itration            | 41       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.31e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -118     |
| Running Env Steps   | 205000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15.2     |
| Running Update Time | 41       |
----------------------------------
--2023-11-10 23:52:55.935107 CST--
| Itration            | 42       |
| Real Det Return     | 2.71e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -127     |
| Running Env Steps   | 210000   |
| Running Forward KL  | 27.7     |
| Running Reverse KL  | 15       |
| Running Update Time | 42       |
----------------------------------
--2023-11-10 23:54:59.137001 CST--
| Itration            | 43       |
| Real Det Return     | 2.63e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.22e+03 |
| Real Sto violation  | 0.05     |
| Reward Loss         | -124     |
| Running Env Steps   | 215000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 15.5     |
| Running Update Time | 43       |
----------------------------------
--2023-11-10 23:57:02.837071 CST--
| Itration            | 44       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.35e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -133     |
| Running Env Steps   | 220000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 15.1     |
| Running Update Time | 44       |
----------------------------------
--2023-11-10 23:59:06.482311 CST--
| Itration            | 45       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -131     |
| Running Env Steps   | 225000   |
| Running Forward KL  | 26.9     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 45       |
----------------------------------
--2023-11-11 00:01:09.707198 CST--
| Itration            | 46       |
| Real Det Return     | 2.62e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -147     |
| Running Env Steps   | 230000   |
| Running Forward KL  | 26.6     |
| Running Reverse KL  | 14.5     |
| Running Update Time | 46       |
----------------------------------
--2023-11-11 00:03:13.127802 CST--
| Itration            | 47       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.32e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -161     |
| Running Env Steps   | 235000   |
| Running Forward KL  | 27.3     |
| Running Reverse KL  | 14.6     |
| Running Update Time | 47       |
----------------------------------
--2023-11-11 00:05:16.948917 CST--
| Itration            | 48       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -180     |
| Running Env Steps   | 240000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 48       |
----------------------------------
--2023-11-11 00:07:20.902120 CST--
| Itration            | 49       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.38e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -177     |
| Running Env Steps   | 245000   |
| Running Forward KL  | 26.7     |
| Running Reverse KL  | 14.2     |
| Running Update Time | 49       |
----------------------------------
--2023-11-11 00:09:25.539486 CST--
| Itration            | 50       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.33e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -165     |
| Running Env Steps   | 250000   |
| Running Forward KL  | 27.4     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 50       |
----------------------------------
--2023-11-11 00:11:23.362441 CST--
| Itration            | 51       |
| Real Det Return     | 2.73e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.34e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -183     |
| Running Env Steps   | 255000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 14.8     |
| Running Update Time | 51       |
----------------------------------
--2023-11-11 00:13:22.469525 CST--
| Itration            | 52       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.36e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -184     |
| Running Env Steps   | 260000   |
| Running Forward KL  | 27.1     |
| Running Reverse KL  | 14.6     |
| Running Update Time | 52       |
----------------------------------
--2023-11-11 00:15:27.772096 CST--
| Itration            | 53       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.49e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -190     |
| Running Env Steps   | 265000   |
| Running Forward KL  | 26       |
| Running Reverse KL  | 14.1     |
| Running Update Time | 53       |
----------------------------------
--2023-11-11 00:17:32.642883 CST--
| Itration            | 54       |
| Real Det Return     | 2.76e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.43e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -201     |
| Running Env Steps   | 270000   |
| Running Forward KL  | 27       |
| Running Reverse KL  | 14.4     |
| Running Update Time | 54       |
----------------------------------
--2023-11-11 00:19:36.771296 CST--
| Itration            | 55       |
| Real Det Return     | 2.68e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.37e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -204     |
| Running Env Steps   | 275000   |
| Running Forward KL  | 27.2     |
| Running Reverse KL  | 14.7     |
| Running Update Time | 55       |
----------------------------------
--2023-11-11 00:21:40.816369 CST--
| Itration            | 56       |
| Real Det Return     | 2.72e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.39e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -220     |
| Running Env Steps   | 280000   |
| Running Forward KL  | 26.7     |
| Running Reverse KL  | 13.9     |
| Running Update Time | 56       |
----------------------------------
--2023-11-11 00:23:44.733297 CST--
| Itration            | 57       |
| Real Det Return     | 2.64e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.41e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -218     |
| Running Env Steps   | 285000   |
| Running Forward KL  | 26.8     |
| Running Reverse KL  | 14       |
| Running Update Time | 57       |
----------------------------------
--2023-11-11 00:25:49.610041 CST--
| Itration            | 58       |
| Real Det Return     | 2.74e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.52e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -208     |
| Running Env Steps   | 290000   |
| Running Forward KL  | 26.1     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 58       |
----------------------------------
--2023-11-11 00:27:52.316260 CST--
| Itration            | 59       |
| Real Det Return     | 2.75e+03 |
| Real Det violation  | 0        |
| Real Sto Return     | 2.47e+03 |
| Real Sto violation  | 0        |
| Reward Loss         | -247     |
| Running Env Steps   | 295000   |
| Running Forward KL  | 26.5     |
| Running Reverse KL  | 14.1     |
| Running Update Time | 59       |
----------------------------------
