Logging to logs/StockMarket/exp-1/maxentirl/2024_05_11_00_57_37
2024-05-11 00:59:45.743204 Eastern Daylight Time
| Itration            | 0        |
| Loss                | 10       |
| Real Det Return     | 402.87   |
| Real Sto Return     | -258.79  |
| Running Env Steps   | 0        |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 0        |
----------------------------------
2024-05-11 01:01:09.113401 Eastern Daylight Time
| Itration            | 1        |
| Loss                | 10       |
| Real Det Return     | 397.1    |
| Real Sto Return     | -256.24  |
| Running Env Steps   | 1260     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 1        |
----------------------------------
2024-05-11 01:02:36.209689 Eastern Daylight Time
| Itration            | 2        |
| Loss                | 10       |
| Real Det Return     | 14.42    |
| Real Sto Return     | -258.83  |
| Running Env Steps   | 2520     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 2        |
----------------------------------
2024-05-11 01:04:00.441223 Eastern Daylight Time
| Itration            | 3        |
| Loss                | 10       |
| Real Det Return     | 293.18   |
| Real Sto Return     | -251.48  |
| Running Env Steps   | 3780     |
| Running Forward KL  | -57.7    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 3        |
----------------------------------
2024-05-11 01:05:24.366220 Eastern Daylight Time
| Itration            | 4        |
| Loss                | 10       |
| Real Det Return     | 243.65   |
| Real Sto Return     | -234.29  |
| Running Env Steps   | 5040     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 4        |
----------------------------------
2024-05-11 01:06:48.681551 Eastern Daylight Time
| Itration            | 5        |
| Loss                | 10       |
| Real Det Return     | 371.0    |
| Real Sto Return     | -297.82  |
| Running Env Steps   | 6300     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 5        |
----------------------------------
2024-05-11 01:08:13.076972 Eastern Daylight Time
| Itration            | 6        |
| Loss                | 10       |
| Real Det Return     | 200.6    |
| Real Sto Return     | -191.86  |
| Running Env Steps   | 7560     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 6        |
----------------------------------
2024-05-11 01:09:37.182333 Eastern Daylight Time
| Itration            | 7        |
| Loss                | 10       |
| Real Det Return     | 304.83   |
| Real Sto Return     | -316.79  |
| Running Env Steps   | 8820     |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 7        |
----------------------------------
2024-05-11 01:11:01.299781 Eastern Daylight Time
| Itration            | 8        |
| Loss                | 10       |
| Real Det Return     | 337.05   |
| Real Sto Return     | -267.48  |
| Running Env Steps   | 10080    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 8        |
----------------------------------
2024-05-11 01:12:26.595320 Eastern Daylight Time
| Itration            | 9        |
| Loss                | 10       |
| Real Det Return     | 65.62    |
| Real Sto Return     | -278.07  |
| Running Env Steps   | 11340    |
| Running Forward KL  | -57.5    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 9        |
----------------------------------
2024-05-11 01:14:05.184556 Eastern Daylight Time
| Itration            | 10       |
| Loss                | 10       |
| Real Det Return     | 215.76   |
| Real Sto Return     | -261.29  |
| Running Env Steps   | 12600    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 10       |
----------------------------------
2024-05-11 01:15:29.465333 Eastern Daylight Time
| Itration            | 11       |
| Loss                | 10       |
| Real Det Return     | -47.86   |
| Real Sto Return     | -299.28  |
| Running Env Steps   | 13860    |
| Running Forward KL  | -57.2    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 11       |
----------------------------------
2024-05-11 01:16:54.029988 Eastern Daylight Time
| Itration            | 12       |
| Loss                | 10       |
| Real Det Return     | 603.27   |
| Real Sto Return     | -246.44  |
| Running Env Steps   | 15120    |
| Running Forward KL  | -56.9    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 12       |
----------------------------------
2024-05-11 01:18:19.481126 Eastern Daylight Time
| Itration            | 13       |
| Loss                | 10       |
| Real Det Return     | 264.38   |
| Real Sto Return     | -276.07  |
| Running Env Steps   | 16380    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 13       |
----------------------------------
2024-05-11 01:19:44.415149 Eastern Daylight Time
| Itration            | 14       |
| Loss                | 10       |
| Real Det Return     | 80.54    |
| Real Sto Return     | -182.59  |
| Running Env Steps   | 17640    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 14       |
----------------------------------
2024-05-11 01:21:09.703270 Eastern Daylight Time
| Itration            | 15       |
| Loss                | 10       |
| Real Det Return     | 325.98   |
| Real Sto Return     | -239.06  |
| Running Env Steps   | 18900    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 15       |
----------------------------------
2024-05-11 01:22:34.511101 Eastern Daylight Time
| Itration            | 16       |
| Loss                | 10       |
| Real Det Return     | 2.12     |
| Real Sto Return     | -247.91  |
| Running Env Steps   | 20160    |
| Running Forward KL  | -57      |
| Running Reverse KL  | -58.3    |
| Running Update Time | 16       |
----------------------------------
2024-05-11 01:24:00.436895 Eastern Daylight Time
| Itration            | 17       |
| Loss                | 10       |
| Real Det Return     | 196.67   |
| Real Sto Return     | -228.28  |
| Running Env Steps   | 21420    |
| Running Forward KL  | -57.5    |
| Running Reverse KL  | -57.6    |
| Running Update Time | 17       |
----------------------------------
2024-05-11 01:25:25.827856 Eastern Daylight Time
| Itration            | 18       |
| Loss                | 10       |
| Real Det Return     | 367.94   |
| Real Sto Return     | -245.35  |
| Running Env Steps   | 22680    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 18       |
----------------------------------
2024-05-11 01:26:50.532170 Eastern Daylight Time
| Itration            | 19       |
| Loss                | 10       |
| Real Det Return     | 153.1    |
| Real Sto Return     | -283.29  |
| Running Env Steps   | 23940    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 19       |
----------------------------------
2024-05-11 01:28:15.847210 Eastern Daylight Time
| Itration            | 20       |
| Loss                | 10       |
| Real Det Return     | 70.09    |
| Real Sto Return     | -208.93  |
| Running Env Steps   | 25200    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 20       |
----------------------------------
2024-05-11 01:29:40.932041 Eastern Daylight Time
| Itration            | 21       |
| Loss                | 10       |
| Real Det Return     | 151.56   |
| Real Sto Return     | -189.97  |
| Running Env Steps   | 26460    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 21       |
----------------------------------
2024-05-11 01:31:07.827405 Eastern Daylight Time
| Itration            | 22       |
| Loss                | 10       |
| Real Det Return     | 113.61   |
| Real Sto Return     | -218.96  |
| Running Env Steps   | 27720    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 22       |
----------------------------------
2024-05-11 01:32:33.026785 Eastern Daylight Time
| Itration            | 23       |
| Loss                | 10       |
| Real Det Return     | 135.22   |
| Real Sto Return     | -227.26  |
| Running Env Steps   | 28980    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 23       |
----------------------------------
2024-05-11 01:33:58.146854 Eastern Daylight Time
| Itration            | 24       |
| Loss                | 10       |
| Real Det Return     | 108.35   |
| Real Sto Return     | -283.94  |
| Running Env Steps   | 30240    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 24       |
----------------------------------
2024-05-11 01:35:23.691092 Eastern Daylight Time
| Itration            | 25       |
| Loss                | 10       |
| Real Det Return     | 152.38   |
| Real Sto Return     | -268.86  |
| Running Env Steps   | 31500    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 25       |
----------------------------------
2024-05-11 01:36:48.945704 Eastern Daylight Time
| Itration            | 26       |
| Loss                | 10       |
| Real Det Return     | 182.11   |
| Real Sto Return     | -271.28  |
| Running Env Steps   | 32760    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 26       |
----------------------------------
2024-05-11 01:38:15.516958 Eastern Daylight Time
| Itration            | 27       |
| Loss                | 10       |
| Real Det Return     | 268.53   |
| Real Sto Return     | -286.18  |
| Running Env Steps   | 34020    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 27       |
----------------------------------
2024-05-11 01:39:41.260733 Eastern Daylight Time
| Itration            | 28       |
| Loss                | 10       |
| Real Det Return     | 339.21   |
| Real Sto Return     | -184.52  |
| Running Env Steps   | 35280    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 28       |
----------------------------------
2024-05-11 01:41:06.867673 Eastern Daylight Time
| Itration            | 29       |
| Loss                | 10       |
| Real Det Return     | 346.75   |
| Real Sto Return     | -245.69  |
| Running Env Steps   | 36540    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 29       |
----------------------------------
2024-05-11 01:42:32.546652 Eastern Daylight Time
| Itration            | 30       |
| Loss                | 10       |
| Real Det Return     | 102.55   |
| Real Sto Return     | -275.1   |
| Running Env Steps   | 37800    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 30       |
----------------------------------
2024-05-11 01:43:58.093323 Eastern Daylight Time
| Itration            | 31       |
| Loss                | 10       |
| Real Det Return     | 299.52   |
| Real Sto Return     | -221.47  |
| Running Env Steps   | 39060    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 31       |
----------------------------------
2024-05-11 01:45:25.390617 Eastern Daylight Time
| Itration            | 32       |
| Loss                | 10       |
| Real Det Return     | 240.65   |
| Real Sto Return     | -283.04  |
| Running Env Steps   | 40320    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 32       |
----------------------------------
2024-05-11 01:46:52.292959 Eastern Daylight Time
| Itration            | 33       |
| Loss                | 10       |
| Real Det Return     | 37.69    |
| Real Sto Return     | -204.37  |
| Running Env Steps   | 41580    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 33       |
----------------------------------
2024-05-11 01:48:18.061658 Eastern Daylight Time
| Itration            | 34       |
| Loss                | 10       |
| Real Det Return     | 131.8    |
| Real Sto Return     | -298.27  |
| Running Env Steps   | 42840    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 34       |
----------------------------------
2024-05-11 01:49:43.891607 Eastern Daylight Time
| Itration            | 35       |
| Loss                | 10       |
| Real Det Return     | 260.8    |
| Real Sto Return     | -297.06  |
| Running Env Steps   | 44100    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 35       |
----------------------------------
2024-05-11 01:51:09.701502 Eastern Daylight Time
| Itration            | 36       |
| Loss                | 10       |
| Real Det Return     | 325.53   |
| Real Sto Return     | -221.95  |
| Running Env Steps   | 45360    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 36       |
----------------------------------
2024-05-11 01:52:35.395601 Eastern Daylight Time
| Itration            | 37       |
| Loss                | 10       |
| Real Det Return     | 151.69   |
| Real Sto Return     | -265.86  |
| Running Env Steps   | 46620    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 37       |
----------------------------------
2024-05-11 01:54:02.999889 Eastern Daylight Time
| Itration            | 38       |
| Loss                | 10       |
| Real Det Return     | 231.3    |
| Real Sto Return     | -216.7   |
| Running Env Steps   | 47880    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 38       |
----------------------------------
2024-05-11 01:55:29.085109 Eastern Daylight Time
| Itration            | 39       |
| Loss                | 10       |
| Real Det Return     | 174.81   |
| Real Sto Return     | -195.37  |
| Running Env Steps   | 49140    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 39       |
----------------------------------
2024-05-11 01:56:55.317007 Eastern Daylight Time
| Itration            | 40       |
| Loss                | 10       |
| Real Det Return     | 329.09   |
| Real Sto Return     | -270.34  |
| Running Env Steps   | 50400    |
| Running Forward KL  | -57.1    |
| Running Reverse KL  | -58.4    |
| Running Update Time | 40       |
----------------------------------
2024-05-11 01:58:21.687867 Eastern Daylight Time
| Itration            | 41       |
| Loss                | 10       |
| Real Det Return     | 485.65   |
| Real Sto Return     | -231.29  |
| Running Env Steps   | 51660    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 41       |
----------------------------------
2024-05-11 01:59:47.825224 Eastern Daylight Time
| Itration            | 42       |
| Loss                | 10       |
| Real Det Return     | 363.8    |
| Real Sto Return     | -175.99  |
| Running Env Steps   | 52920    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 42       |
----------------------------------
2024-05-11 02:01:13.901353 Eastern Daylight Time
| Itration            | 43       |
| Loss                | 10       |
| Real Det Return     | 253.19   |
| Real Sto Return     | -223.31  |
| Running Env Steps   | 54180    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 43       |
----------------------------------
2024-05-11 02:02:41.247307 Eastern Daylight Time
| Itration            | 44       |
| Loss                | 10       |
| Real Det Return     | 166.08   |
| Real Sto Return     | -186.22  |
| Running Env Steps   | 55440    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 44       |
----------------------------------
2024-05-11 02:04:09.829091 Eastern Daylight Time
| Itration            | 45       |
| Loss                | 10       |
| Real Det Return     | 250.22   |
| Real Sto Return     | -224.74  |
| Running Env Steps   | 56700    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 45       |
----------------------------------
2024-05-11 02:05:36.421140 Eastern Daylight Time
| Itration            | 46       |
| Loss                | 10       |
| Real Det Return     | 100.72   |
| Real Sto Return     | -247.79  |
| Running Env Steps   | 57960    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 46       |
----------------------------------
2024-05-11 02:07:03.408862 Eastern Daylight Time
| Itration            | 47       |
| Loss                | 10       |
| Real Det Return     | 213.43   |
| Real Sto Return     | -263.34  |
| Running Env Steps   | 59220    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 47       |
----------------------------------
2024-05-11 02:08:30.387820 Eastern Daylight Time
| Itration            | 48       |
| Loss                | 10       |
| Real Det Return     | 296.57   |
| Real Sto Return     | -220.46  |
| Running Env Steps   | 60480    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 48       |
----------------------------------
2024-05-11 02:09:57.442398 Eastern Daylight Time
| Itration            | 49       |
| Loss                | 10       |
| Real Det Return     | 469.37   |
| Real Sto Return     | -208.86  |
| Running Env Steps   | 61740    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 49       |
----------------------------------
2024-05-11 02:11:24.605166 Eastern Daylight Time
| Itration            | 50       |
| Loss                | 10       |
| Real Det Return     | 70.87    |
| Real Sto Return     | -248.57  |
| Running Env Steps   | 63000    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 50       |
----------------------------------
2024-05-11 02:12:51.732283 Eastern Daylight Time
| Itration            | 51       |
| Loss                | 10       |
| Real Det Return     | 140.27   |
| Real Sto Return     | -148.68  |
| Running Env Steps   | 64260    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 51       |
----------------------------------
2024-05-11 02:14:21.904881 Eastern Daylight Time
| Itration            | 52       |
| Loss                | 10       |
| Real Det Return     | 73.1     |
| Real Sto Return     | -223.73  |
| Running Env Steps   | 65520    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 52       |
----------------------------------
2024-05-11 02:15:49.285610 Eastern Daylight Time
| Itration            | 53       |
| Loss                | 10       |
| Real Det Return     | 236.86   |
| Real Sto Return     | -287.1   |
| Running Env Steps   | 66780    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 53       |
----------------------------------
2024-05-11 02:17:17.792864 Eastern Daylight Time
| Itration            | 54       |
| Loss                | 10       |
| Real Det Return     | 219.18   |
| Real Sto Return     | -277.45  |
| Running Env Steps   | 68040    |
| Running Forward KL  | -56.9    |
| Running Reverse KL  | -57.3    |
| Running Update Time | 54       |
----------------------------------
2024-05-11 02:18:45.765568 Eastern Daylight Time
| Itration            | 55       |
| Loss                | 10       |
| Real Det Return     | 261.91   |
| Real Sto Return     | -249.0   |
| Running Env Steps   | 69300    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 55       |
----------------------------------
2024-05-11 02:20:13.708655 Eastern Daylight Time
| Itration            | 56       |
| Loss                | 10       |
| Real Det Return     | 158.45   |
| Real Sto Return     | -273.88  |
| Running Env Steps   | 70560    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 56       |
----------------------------------
2024-05-11 02:21:41.726810 Eastern Daylight Time
| Itration            | 57       |
| Loss                | 10       |
| Real Det Return     | 191.08   |
| Real Sto Return     | -226.9   |
| Running Env Steps   | 71820    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 57       |
----------------------------------
2024-05-11 02:23:10.532128 Eastern Daylight Time
| Itration            | 58       |
| Loss                | 10       |
| Real Det Return     | 103.48   |
| Real Sto Return     | -245.66  |
| Running Env Steps   | 73080    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 58       |
----------------------------------
2024-05-11 02:24:47.758260 Eastern Daylight Time
| Itration            | 59       |
| Loss                | 10       |
| Real Det Return     | 275.22   |
| Real Sto Return     | -288.77  |
| Running Env Steps   | 74340    |
| Running Forward KL  | -57      |
| Running Reverse KL  | -57.4    |
| Running Update Time | 59       |
----------------------------------
2024-05-11 02:26:17.104654 Eastern Daylight Time
| Itration            | 60       |
| Loss                | 10       |
| Real Det Return     | 251.81   |
| Real Sto Return     | -348.01  |
| Running Env Steps   | 75600    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 60       |
----------------------------------
2024-05-11 02:27:47.131378 Eastern Daylight Time
| Itration            | 61       |
| Loss                | 10       |
| Real Det Return     | 144.99   |
| Real Sto Return     | -224.73  |
| Running Env Steps   | 76860    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 61       |
----------------------------------
2024-05-11 02:29:17.909543 Eastern Daylight Time
| Itration            | 62       |
| Loss                | 10       |
| Real Det Return     | 125.48   |
| Real Sto Return     | -181.66  |
| Running Env Steps   | 78120    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.6    |
| Running Update Time | 62       |
----------------------------------
2024-05-11 02:30:49.705171 Eastern Daylight Time
| Itration            | 63       |
| Loss                | 10       |
| Real Det Return     | 153.23   |
| Real Sto Return     | -222.48  |
| Running Env Steps   | 79380    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 63       |
----------------------------------
2024-05-11 02:32:22.988713 Eastern Daylight Time
| Itration            | 64       |
| Loss                | 10       |
| Real Det Return     | 346.98   |
| Real Sto Return     | -269.78  |
| Running Env Steps   | 80640    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 64       |
----------------------------------
2024-05-11 02:33:56.552780 Eastern Daylight Time
| Itration            | 65       |
| Loss                | 10       |
| Real Det Return     | 148.07   |
| Real Sto Return     | -332.65  |
| Running Env Steps   | 81900    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 65       |
----------------------------------
2024-05-11 02:35:31.214016 Eastern Daylight Time
| Itration            | 66       |
| Loss                | 10       |
| Real Det Return     | 279.95   |
| Real Sto Return     | -298.51  |
| Running Env Steps   | 83160    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 66       |
----------------------------------
2024-05-11 02:37:06.907553 Eastern Daylight Time
| Itration            | 67       |
| Loss                | 10       |
| Real Det Return     | 234.95   |
| Real Sto Return     | -232.54  |
| Running Env Steps   | 84420    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 67       |
----------------------------------
2024-05-11 02:38:46.571981 Eastern Daylight Time
| Itration            | 68       |
| Loss                | 10       |
| Real Det Return     | 145.24   |
| Real Sto Return     | -278.89  |
| Running Env Steps   | 85680    |
| Running Forward KL  | -57.3    |
| Running Reverse KL  | -58.1    |
| Running Update Time | 68       |
----------------------------------
2024-05-11 02:40:24.350774 Eastern Daylight Time
| Itration            | 69       |
| Loss                | 10       |
| Real Det Return     | 171.56   |
| Real Sto Return     | -247.9   |
| Running Env Steps   | 86940    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 69       |
----------------------------------
2024-05-11 02:42:02.495552 Eastern Daylight Time
| Itration            | 70       |
| Loss                | 10       |
| Real Det Return     | 103.58   |
| Real Sto Return     | -249.95  |
| Running Env Steps   | 88200    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 70       |
----------------------------------
2024-05-11 02:43:41.805416 Eastern Daylight Time
| Itration            | 71       |
| Loss                | 10       |
| Real Det Return     | 222.84   |
| Real Sto Return     | -230.08  |
| Running Env Steps   | 89460    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 71       |
----------------------------------
2024-05-11 02:45:25.308988 Eastern Daylight Time
| Itration            | 72       |
| Loss                | 10       |
| Real Det Return     | 92.92    |
| Real Sto Return     | -281.1   |
| Running Env Steps   | 90720    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 72       |
----------------------------------
2024-05-11 02:47:07.286680 Eastern Daylight Time
| Itration            | 73       |
| Loss                | 10       |
| Real Det Return     | 353.95   |
| Real Sto Return     | -228.17  |
| Running Env Steps   | 91980    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 73       |
----------------------------------
2024-05-11 02:48:49.966646 Eastern Daylight Time
| Itration            | 74       |
| Loss                | 10       |
| Real Det Return     | 68.37    |
| Real Sto Return     | -212.86  |
| Running Env Steps   | 93240    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 74       |
----------------------------------
2024-05-11 02:50:33.319874 Eastern Daylight Time
| Itration            | 75       |
| Loss                | 10       |
| Real Det Return     | 158.04   |
| Real Sto Return     | -265.62  |
| Running Env Steps   | 94500    |
| Running Forward KL  | -56.8    |
| Running Reverse KL  | -57.6    |
| Running Update Time | 75       |
----------------------------------
2024-05-11 02:52:17.449324 Eastern Daylight Time
| Itration            | 76       |
| Loss                | 10       |
| Real Det Return     | 267.55   |
| Real Sto Return     | -231.12  |
| Running Env Steps   | 95760    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 76       |
----------------------------------
2024-05-11 02:54:05.204538 Eastern Daylight Time
| Itration            | 77       |
| Loss                | 10       |
| Real Det Return     | 320.88   |
| Real Sto Return     | -277.23  |
| Running Env Steps   | 97020    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 77       |
----------------------------------
2024-05-11 02:55:49.552076 Eastern Daylight Time
| Itration            | 78       |
| Loss                | 10       |
| Real Det Return     | 317.08   |
| Real Sto Return     | -246.57  |
| Running Env Steps   | 98280    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 78       |
----------------------------------
2024-05-11 02:57:34.245377 Eastern Daylight Time
| Itration            | 79       |
| Loss                | 10       |
| Real Det Return     | 144.42   |
| Real Sto Return     | -224.76  |
| Running Env Steps   | 99540    |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 79       |
----------------------------------
2024-05-11 02:59:19.420204 Eastern Daylight Time
| Itration            | 80       |
| Loss                | 10       |
| Real Det Return     | 209.41   |
| Real Sto Return     | -324.65  |
| Running Env Steps   | 100800   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 80       |
----------------------------------
2024-05-11 03:01:04.243424 Eastern Daylight Time
| Itration            | 81       |
| Loss                | 10       |
| Real Det Return     | 177.01   |
| Real Sto Return     | -268.36  |
| Running Env Steps   | 102060   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 81       |
----------------------------------
2024-05-11 03:02:50.038460 Eastern Daylight Time
| Itration            | 82       |
| Loss                | 10       |
| Real Det Return     | 189.67   |
| Real Sto Return     | -269.1   |
| Running Env Steps   | 103320   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 82       |
----------------------------------
2024-05-11 03:04:35.055216 Eastern Daylight Time
| Itration            | 83       |
| Loss                | 10       |
| Real Det Return     | 181.06   |
| Real Sto Return     | -218.55  |
| Running Env Steps   | 104580   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 83       |
----------------------------------
2024-05-11 03:06:23.235566 Eastern Daylight Time
| Itration            | 84       |
| Loss                | 10       |
| Real Det Return     | -31.53   |
| Real Sto Return     | -259.83  |
| Running Env Steps   | 105840   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 84       |
----------------------------------
2024-05-11 03:08:11.405235 Eastern Daylight Time
| Itration            | 85       |
| Loss                | 10       |
| Real Det Return     | 148.42   |
| Real Sto Return     | -292.41  |
| Running Env Steps   | 107100   |
| Running Forward KL  | -57.2    |
| Running Reverse KL  | -57.4    |
| Running Update Time | 85       |
----------------------------------
2024-05-11 03:09:56.509471 Eastern Daylight Time
| Itration            | 86       |
| Loss                | 10       |
| Real Det Return     | 209.55   |
| Real Sto Return     | -196.48  |
| Running Env Steps   | 108360   |
| Running Forward KL  | -56.5    |
| Running Reverse KL  | -57.2    |
| Running Update Time | 86       |
----------------------------------
2024-05-11 03:11:42.155565 Eastern Daylight Time
| Itration            | 87       |
| Loss                | 10       |
| Real Det Return     | 147.1    |
| Real Sto Return     | -335.88  |
| Running Env Steps   | 109620   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 87       |
----------------------------------
2024-05-11 03:13:37.152790 Eastern Daylight Time
| Itration            | 88       |
| Loss                | 10       |
| Real Det Return     | 217.79   |
| Real Sto Return     | -273.94  |
| Running Env Steps   | 110880   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 88       |
----------------------------------
2024-05-11 03:15:31.885035 Eastern Daylight Time
| Itration            | 89       |
| Loss                | 10       |
| Real Det Return     | 377.84   |
| Real Sto Return     | -245.49  |
| Running Env Steps   | 112140   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 89       |
----------------------------------
2024-05-11 03:17:18.157786 Eastern Daylight Time
| Itration            | 90       |
| Loss                | 10       |
| Real Det Return     | 113.78   |
| Real Sto Return     | -233.4   |
| Running Env Steps   | 113400   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 90       |
----------------------------------
2024-05-11 03:19:22.833136 Eastern Daylight Time
| Itration            | 91       |
| Loss                | 10       |
| Real Det Return     | 81.68    |
| Real Sto Return     | -194.78  |
| Running Env Steps   | 114660   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 91       |
----------------------------------
2024-05-11 03:21:16.724452 Eastern Daylight Time
| Itration            | 92       |
| Loss                | 10       |
| Real Det Return     | 207.78   |
| Real Sto Return     | -219.31  |
| Running Env Steps   | 115920   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 92       |
----------------------------------
2024-05-11 03:23:02.303911 Eastern Daylight Time
| Itration            | 93       |
| Loss                | 10       |
| Real Det Return     | 269.57   |
| Real Sto Return     | -359.69  |
| Running Env Steps   | 117180   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 93       |
----------------------------------
2024-05-11 03:24:48.802766 Eastern Daylight Time
| Itration            | 94       |
| Loss                | 10       |
| Real Det Return     | 57.03    |
| Real Sto Return     | -261.97  |
| Running Env Steps   | 118440   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 94       |
----------------------------------
2024-05-11 03:26:38.683954 Eastern Daylight Time
| Itration            | 95       |
| Loss                | 10       |
| Real Det Return     | 221.79   |
| Real Sto Return     | -180.48  |
| Running Env Steps   | 119700   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 95       |
----------------------------------
2024-05-11 03:28:24.586572 Eastern Daylight Time
| Itration            | 96       |
| Loss                | 10       |
| Real Det Return     | 42.57    |
| Real Sto Return     | -271.93  |
| Running Env Steps   | 120960   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 96       |
----------------------------------
2024-05-11 03:30:12.117901 Eastern Daylight Time
| Itration            | 97       |
| Loss                | 10       |
| Real Det Return     | 479.67   |
| Real Sto Return     | -280.02  |
| Running Env Steps   | 122220   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 97       |
----------------------------------
2024-05-11 03:31:58.436730 Eastern Daylight Time
| Itration            | 98       |
| Loss                | 10       |
| Real Det Return     | 361.38   |
| Real Sto Return     | -308.11  |
| Running Env Steps   | 123480   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 98       |
----------------------------------
2024-05-11 03:34:29.856227 Eastern Daylight Time
| Itration            | 99       |
| Loss                | 10       |
| Real Det Return     | 139.75   |
| Real Sto Return     | -224.54  |
| Running Env Steps   | 124740   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 99       |
----------------------------------
2024-05-11 03:36:20.140416 Eastern Daylight Time
| Itration            | 100      |
| Loss                | 10       |
| Real Det Return     | 314.18   |
| Real Sto Return     | -268.47  |
| Running Env Steps   | 126000   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 100      |
----------------------------------
2024-05-11 03:38:10.086530 Eastern Daylight Time
| Itration            | 101      |
| Loss                | 10       |
| Real Det Return     | 83.72    |
| Real Sto Return     | -278.0   |
| Running Env Steps   | 127260   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 101      |
----------------------------------
2024-05-11 03:40:07.081843 Eastern Daylight Time
| Itration            | 102      |
| Loss                | 10       |
| Real Det Return     | 329.46   |
| Real Sto Return     | -249.28  |
| Running Env Steps   | 128520   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 102      |
----------------------------------
2024-05-11 03:41:57.294558 Eastern Daylight Time
| Itration            | 103      |
| Loss                | 10       |
| Real Det Return     | 343.13   |
| Real Sto Return     | -213.75  |
| Running Env Steps   | 129780   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 103      |
----------------------------------
2024-05-11 03:43:50.395922 Eastern Daylight Time
| Itration            | 104      |
| Loss                | 10       |
| Real Det Return     | 46.21    |
| Real Sto Return     | -237.03  |
| Running Env Steps   | 131040   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 104      |
----------------------------------
2024-05-11 03:45:41.165617 Eastern Daylight Time
| Itration            | 105      |
| Loss                | 10       |
| Real Det Return     | 410.69   |
| Real Sto Return     | -223.78  |
| Running Env Steps   | 132300   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 105      |
----------------------------------
2024-05-11 03:47:37.956407 Eastern Daylight Time
| Itration            | 106      |
| Loss                | 10       |
| Real Det Return     | 99.87    |
| Real Sto Return     | -268.42  |
| Running Env Steps   | 133560   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 106      |
----------------------------------
2024-05-11 03:49:32.619004 Eastern Daylight Time
| Itration            | 107      |
| Loss                | 10       |
| Real Det Return     | 172.67   |
| Real Sto Return     | -326.76  |
| Running Env Steps   | 134820   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 107      |
----------------------------------
2024-05-11 03:51:27.156296 Eastern Daylight Time
| Itration            | 108      |
| Loss                | 10       |
| Real Det Return     | 304.41   |
| Real Sto Return     | -231.13  |
| Running Env Steps   | 136080   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 108      |
----------------------------------
2024-05-11 03:53:17.899636 Eastern Daylight Time
| Itration            | 109      |
| Loss                | 10       |
| Real Det Return     | 229.94   |
| Real Sto Return     | -205.03  |
| Running Env Steps   | 137340   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 109      |
----------------------------------
2024-05-11 03:55:09.207703 Eastern Daylight Time
| Itration            | 110      |
| Loss                | 10       |
| Real Det Return     | 222.45   |
| Real Sto Return     | -248.44  |
| Running Env Steps   | 138600   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 110      |
----------------------------------
2024-05-11 03:58:22.302375 Eastern Daylight Time
| Itration            | 111      |
| Loss                | 10       |
| Real Det Return     | 182.13   |
| Real Sto Return     | -306.89  |
| Running Env Steps   | 139860   |
| Running Forward KL  | -57.4    |
| Running Reverse KL  | -57.8    |
| Running Update Time | 111      |
----------------------------------
2024-05-11 04:00:27.063172 Eastern Daylight Time
| Itration            | 112      |
| Loss                | 10       |
| Real Det Return     | 390.5    |
| Real Sto Return     | -238.4   |
| Running Env Steps   | 141120   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 112      |
----------------------------------
2024-05-11 04:02:22.420799 Eastern Daylight Time
| Itration            | 113      |
| Loss                | 10       |
| Real Det Return     | 319.29   |
| Real Sto Return     | -289.97  |
| Running Env Steps   | 142380   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 113      |
----------------------------------
2024-05-11 04:04:14.336746 Eastern Daylight Time
| Itration            | 114      |
| Loss                | 10       |
| Real Det Return     | 188.77   |
| Real Sto Return     | -255.41  |
| Running Env Steps   | 143640   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 114      |
----------------------------------
2024-05-11 04:06:06.181814 Eastern Daylight Time
| Itration            | 115      |
| Loss                | 10       |
| Real Det Return     | 181.25   |
| Real Sto Return     | -241.85  |
| Running Env Steps   | 144900   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.7    |
| Running Update Time | 115      |
----------------------------------
2024-05-11 04:07:58.969525 Eastern Daylight Time
| Itration            | 116      |
| Loss                | 10       |
| Real Det Return     | 54.46    |
| Real Sto Return     | -216.98  |
| Running Env Steps   | 146160   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 116      |
----------------------------------
2024-05-11 04:09:52.181030 Eastern Daylight Time
| Itration            | 117      |
| Loss                | 10       |
| Real Det Return     | 88.91    |
| Real Sto Return     | -274.57  |
| Running Env Steps   | 147420   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 117      |
----------------------------------
2024-05-11 04:11:45.605902 Eastern Daylight Time
| Itration            | 118      |
| Loss                | 10       |
| Real Det Return     | 164.02   |
| Real Sto Return     | -275.25  |
| Running Env Steps   | 148680   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 118      |
----------------------------------
2024-05-11 04:13:42.647470 Eastern Daylight Time
| Itration            | 119      |
| Loss                | 10       |
| Real Det Return     | 194.19   |
| Real Sto Return     | -256.04  |
| Running Env Steps   | 149940   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 119      |
----------------------------------
2024-05-11 04:15:45.103186 Eastern Daylight Time
| Itration            | 120      |
| Loss                | 10       |
| Real Det Return     | 240.28   |
| Real Sto Return     | -216.88  |
| Running Env Steps   | 151200   |
| Running Forward KL  | -57.3    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 120      |
----------------------------------
2024-05-11 04:17:38.602311 Eastern Daylight Time
| Itration            | 121      |
| Loss                | 10       |
| Real Det Return     | -13.0    |
| Real Sto Return     | -221.72  |
| Running Env Steps   | 152460   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 121      |
----------------------------------
2024-05-11 04:19:31.474793 Eastern Daylight Time
| Itration            | 122      |
| Loss                | 10       |
| Real Det Return     | 247.15   |
| Real Sto Return     | -304.91  |
| Running Env Steps   | 153720   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 122      |
----------------------------------
2024-05-11 04:21:24.414461 Eastern Daylight Time
| Itration            | 123      |
| Loss                | 10       |
| Real Det Return     | 79.42    |
| Real Sto Return     | -268.8   |
| Running Env Steps   | 154980   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 123      |
----------------------------------
2024-05-11 04:23:18.249044 Eastern Daylight Time
| Itration            | 124      |
| Loss                | 10       |
| Real Det Return     | 106.22   |
| Real Sto Return     | -294.77  |
| Running Env Steps   | 156240   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 124      |
----------------------------------
2024-05-11 04:27:01.200127 Eastern Daylight Time
| Itration            | 125      |
| Loss                | 10       |
| Real Det Return     | 242.71   |
| Real Sto Return     | -219.78  |
| Running Env Steps   | 157500   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 125      |
----------------------------------
2024-05-11 04:28:54.525780 Eastern Daylight Time
| Itration            | 126      |
| Loss                | 10       |
| Real Det Return     | 142.64   |
| Real Sto Return     | -209.12  |
| Running Env Steps   | 158760   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 126      |
----------------------------------
2024-05-11 04:30:47.673525 Eastern Daylight Time
| Itration            | 127      |
| Loss                | 10       |
| Real Det Return     | 30.41    |
| Real Sto Return     | -248.79  |
| Running Env Steps   | 160020   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 127      |
----------------------------------
2024-05-11 04:32:42.050822 Eastern Daylight Time
| Itration            | 128      |
| Loss                | 10       |
| Real Det Return     | 267.54   |
| Real Sto Return     | -243.92  |
| Running Env Steps   | 161280   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 128      |
----------------------------------
2024-05-11 04:34:36.537364 Eastern Daylight Time
| Itration            | 129      |
| Loss                | 10       |
| Real Det Return     | 202.86   |
| Real Sto Return     | -220.84  |
| Running Env Steps   | 162540   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 129      |
----------------------------------
2024-05-11 04:36:32.669072 Eastern Daylight Time
| Itration            | 130      |
| Loss                | 10       |
| Real Det Return     | 119.45   |
| Real Sto Return     | -290.1   |
| Running Env Steps   | 163800   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 130      |
----------------------------------
2024-05-11 04:38:26.731330 Eastern Daylight Time
| Itration            | 131      |
| Loss                | 10       |
| Real Det Return     | 117.78   |
| Real Sto Return     | -236.01  |
| Running Env Steps   | 165060   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 131      |
----------------------------------
2024-05-11 04:40:20.361240 Eastern Daylight Time
| Itration            | 132      |
| Loss                | 10       |
| Real Det Return     | 322.27   |
| Real Sto Return     | -294.46  |
| Running Env Steps   | 166320   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 132      |
----------------------------------
2024-05-11 04:42:13.888778 Eastern Daylight Time
| Itration            | 133      |
| Loss                | 10       |
| Real Det Return     | 182.21   |
| Real Sto Return     | -267.12  |
| Running Env Steps   | 167580   |
| Running Forward KL  | -56.4    |
| Running Reverse KL  | -57.2    |
| Running Update Time | 133      |
----------------------------------
2024-05-11 04:44:07.830671 Eastern Daylight Time
| Itration            | 134      |
| Loss                | 10       |
| Real Det Return     | 162.24   |
| Real Sto Return     | -268.18  |
| Running Env Steps   | 168840   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 134      |
----------------------------------
2024-05-11 04:46:04.993082 Eastern Daylight Time
| Itration            | 135      |
| Loss                | 10       |
| Real Det Return     | 280.17   |
| Real Sto Return     | -268.32  |
| Running Env Steps   | 170100   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 135      |
----------------------------------
2024-05-11 04:47:58.672692 Eastern Daylight Time
| Itration            | 136      |
| Loss                | 10       |
| Real Det Return     | 73.35    |
| Real Sto Return     | -294.34  |
| Running Env Steps   | 171360   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 136      |
----------------------------------
2024-05-11 04:49:52.348112 Eastern Daylight Time
| Itration            | 137      |
| Loss                | 10       |
| Real Det Return     | 238.19   |
| Real Sto Return     | -242.75  |
| Running Env Steps   | 172620   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 137      |
----------------------------------
2024-05-11 04:51:45.256676 Eastern Daylight Time
| Itration            | 138      |
| Loss                | 10       |
| Real Det Return     | 110.96   |
| Real Sto Return     | -353.77  |
| Running Env Steps   | 173880   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 138      |
----------------------------------
2024-05-11 04:56:58.791971 Eastern Daylight Time
| Itration            | 139      |
| Loss                | 10       |
| Real Det Return     | 97.71    |
| Real Sto Return     | -232.95  |
| Running Env Steps   | 175140   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 139      |
----------------------------------
2024-05-11 04:58:56.025451 Eastern Daylight Time
| Itration            | 140      |
| Loss                | 10       |
| Real Det Return     | 343.99   |
| Real Sto Return     | -248.03  |
| Running Env Steps   | 176400   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 140      |
----------------------------------
2024-05-11 05:00:51.010746 Eastern Daylight Time
| Itration            | 141      |
| Loss                | 10       |
| Real Det Return     | 151.34   |
| Real Sto Return     | -268.62  |
| Running Env Steps   | 177660   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 141      |
----------------------------------
2024-05-11 05:02:45.798280 Eastern Daylight Time
| Itration            | 142      |
| Loss                | 10       |
| Real Det Return     | 199.69   |
| Real Sto Return     | -255.74  |
| Running Env Steps   | 178920   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 142      |
----------------------------------
2024-05-11 05:04:41.508213 Eastern Daylight Time
| Itration            | 143      |
| Loss                | 10       |
| Real Det Return     | 529.44   |
| Real Sto Return     | -235.33  |
| Running Env Steps   | 180180   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 143      |
----------------------------------
2024-05-11 05:06:36.071113 Eastern Daylight Time
| Itration            | 144      |
| Loss                | 10       |
| Real Det Return     | 15.69    |
| Real Sto Return     | -245.73  |
| Running Env Steps   | 181440   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 144      |
----------------------------------
2024-05-11 05:08:30.849846 Eastern Daylight Time
| Itration            | 145      |
| Loss                | 10       |
| Real Det Return     | 113.59   |
| Real Sto Return     | -257.92  |
| Running Env Steps   | 182700   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 145      |
----------------------------------
2024-05-11 05:10:26.007018 Eastern Daylight Time
| Itration            | 146      |
| Loss                | 10       |
| Real Det Return     | 73.12    |
| Real Sto Return     | -179.77  |
| Running Env Steps   | 183960   |
| Running Forward KL  | -56.7    |
| Running Reverse KL  | -58      |
| Running Update Time | 146      |
----------------------------------
2024-05-11 05:12:21.839170 Eastern Daylight Time
| Itration            | 147      |
| Loss                | 10       |
| Real Det Return     | 129.24   |
| Real Sto Return     | -220.37  |
| Running Env Steps   | 185220   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 147      |
----------------------------------
2024-05-11 05:14:18.495700 Eastern Daylight Time
| Itration            | 148      |
| Loss                | 10       |
| Real Det Return     | 293.16   |
| Real Sto Return     | -269.56  |
| Running Env Steps   | 186480   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.6    |
| Running Update Time | 148      |
----------------------------------
2024-05-11 05:16:14.789601 Eastern Daylight Time
| Itration            | 149      |
| Loss                | 10       |
| Real Det Return     | 342.98   |
| Real Sto Return     | -208.55  |
| Running Env Steps   | 187740   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 149      |
----------------------------------
2024-05-11 05:18:18.614307 Eastern Daylight Time
| Itration            | 150      |
| Loss                | 10       |
| Real Det Return     | 435.21   |
| Real Sto Return     | -206.34  |
| Running Env Steps   | 189000   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 150      |
----------------------------------
2024-05-11 05:20:12.746391 Eastern Daylight Time
| Itration            | 151      |
| Loss                | 10       |
| Real Det Return     | 439.99   |
| Real Sto Return     | -322.44  |
| Running Env Steps   | 190260   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 151      |
----------------------------------
2024-05-11 05:22:07.953374 Eastern Daylight Time
| Itration            | 152      |
| Loss                | 10       |
| Real Det Return     | 107.39   |
| Real Sto Return     | -254.43  |
| Running Env Steps   | 191520   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 152      |
----------------------------------
2024-05-11 05:24:02.793801 Eastern Daylight Time
| Itration            | 153      |
| Loss                | 10       |
| Real Det Return     | 273.86   |
| Real Sto Return     | -221.15  |
| Running Env Steps   | 192780   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 153      |
----------------------------------
2024-05-11 05:25:58.378039 Eastern Daylight Time
| Itration            | 154      |
| Loss                | 10       |
| Real Det Return     | 366.51   |
| Real Sto Return     | -210.88  |
| Running Env Steps   | 194040   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 154      |
----------------------------------
2024-05-11 05:27:54.334958 Eastern Daylight Time
| Itration            | 155      |
| Loss                | 10       |
| Real Det Return     | 18.46    |
| Real Sto Return     | -232.57  |
| Running Env Steps   | 195300   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 155      |
----------------------------------
2024-05-11 05:34:18.918261 Eastern Daylight Time
| Itration            | 156      |
| Loss                | 10       |
| Real Det Return     | 219.06   |
| Real Sto Return     | -227.21  |
| Running Env Steps   | 196560   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 156      |
----------------------------------
2024-05-11 05:36:19.823162 Eastern Daylight Time
| Itration            | 157      |
| Loss                | 10       |
| Real Det Return     | 154.46   |
| Real Sto Return     | -303.73  |
| Running Env Steps   | 197820   |
| Running Forward KL  | -57.4    |
| Running Reverse KL  | -57.4    |
| Running Update Time | 157      |
----------------------------------
2024-05-11 05:38:13.353641 Eastern Daylight Time
| Itration            | 158      |
| Loss                | 10       |
| Real Det Return     | 166.53   |
| Real Sto Return     | -281.63  |
| Running Env Steps   | 199080   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 158      |
----------------------------------
2024-05-11 05:40:19.664554 Eastern Daylight Time
| Itration            | 159      |
| Loss                | 10       |
| Real Det Return     | 291.75   |
| Real Sto Return     | -247.18  |
| Running Env Steps   | 200340   |
| Running Forward KL  | -56.7    |
| Running Reverse KL  | -58.2    |
| Running Update Time | 159      |
----------------------------------
2024-05-11 05:42:20.351789 Eastern Daylight Time
| Itration            | 160      |
| Loss                | 10       |
| Real Det Return     | 213.51   |
| Real Sto Return     | -275.11  |
| Running Env Steps   | 201600   |
| Running Forward KL  | -57.5    |
| Running Reverse KL  | -57.4    |
| Running Update Time | 160      |
----------------------------------
2024-05-11 05:44:16.950340 Eastern Daylight Time
| Itration            | 161      |
| Loss                | 10       |
| Real Det Return     | 75.55    |
| Real Sto Return     | -225.13  |
| Running Env Steps   | 202860   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 161      |
----------------------------------
2024-05-11 05:46:12.328381 Eastern Daylight Time
| Itration            | 162      |
| Loss                | 10       |
| Real Det Return     | 326.67   |
| Real Sto Return     | -320.54  |
| Running Env Steps   | 204120   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 162      |
----------------------------------
2024-05-11 05:48:07.869203 Eastern Daylight Time
| Itration            | 163      |
| Loss                | 10       |
| Real Det Return     | 170.92   |
| Real Sto Return     | -253.36  |
| Running Env Steps   | 205380   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 163      |
----------------------------------
2024-05-11 05:50:04.681469 Eastern Daylight Time
| Itration            | 164      |
| Loss                | 10       |
| Real Det Return     | 81.68    |
| Real Sto Return     | -252.2   |
| Running Env Steps   | 206640   |
| Running Forward KL  | -56.9    |
| Running Reverse KL  | -57.3    |
| Running Update Time | 164      |
----------------------------------
2024-05-11 05:51:59.655288 Eastern Daylight Time
| Itration            | 165      |
| Loss                | 10       |
| Real Det Return     | 385.56   |
| Real Sto Return     | -272.74  |
| Running Env Steps   | 207900   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 165      |
----------------------------------
2024-05-11 05:53:55.428096 Eastern Daylight Time
| Itration            | 166      |
| Loss                | 10       |
| Real Det Return     | 265.42   |
| Real Sto Return     | -280.53  |
| Running Env Steps   | 209160   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 166      |
----------------------------------
2024-05-11 05:55:51.153834 Eastern Daylight Time
| Itration            | 167      |
| Loss                | 10       |
| Real Det Return     | 52.56    |
| Real Sto Return     | -249.1   |
| Running Env Steps   | 210420   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 167      |
----------------------------------
2024-05-11 05:57:47.070390 Eastern Daylight Time
| Itration            | 168      |
| Loss                | 10       |
| Real Det Return     | 42.84    |
| Real Sto Return     | -248.16  |
| Running Env Steps   | 211680   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 168      |
----------------------------------
2024-05-11 05:59:46.168651 Eastern Daylight Time
| Itration            | 169      |
| Loss                | 10       |
| Real Det Return     | 339.2    |
| Real Sto Return     | -266.06  |
| Running Env Steps   | 212940   |
| Running Forward KL  | -57.3    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 169      |
----------------------------------
2024-05-11 06:01:41.956257 Eastern Daylight Time
| Itration            | 170      |
| Loss                | 10       |
| Real Det Return     | 206.55   |
| Real Sto Return     | -256.3   |
| Running Env Steps   | 214200   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 170      |
----------------------------------
2024-05-11 06:03:38.929739 Eastern Daylight Time
| Itration            | 171      |
| Loss                | 10       |
| Real Det Return     | 366.33   |
| Real Sto Return     | -298.13  |
| Running Env Steps   | 215460   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 171      |
----------------------------------
2024-05-11 06:05:35.040837 Eastern Daylight Time
| Itration            | 172      |
| Loss                | 10       |
| Real Det Return     | 225.46   |
| Real Sto Return     | -235.77  |
| Running Env Steps   | 216720   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 172      |
----------------------------------
2024-05-11 06:07:34.533100 Eastern Daylight Time
| Itration            | 173      |
| Loss                | 10       |
| Real Det Return     | 404.54   |
| Real Sto Return     | -281.68  |
| Running Env Steps   | 217980   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 173      |
----------------------------------
2024-05-11 06:14:48.294930 Eastern Daylight Time
| Itration            | 174      |
| Loss                | 10       |
| Real Det Return     | 183.86   |
| Real Sto Return     | -262.16  |
| Running Env Steps   | 219240   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 174      |
----------------------------------
2024-05-11 06:16:44.066762 Eastern Daylight Time
| Itration            | 175      |
| Loss                | 10       |
| Real Det Return     | 171.32   |
| Real Sto Return     | -269.1   |
| Running Env Steps   | 220500   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 175      |
----------------------------------
2024-05-11 06:18:41.265337 Eastern Daylight Time
| Itration            | 176      |
| Loss                | 10       |
| Real Det Return     | 34.16    |
| Real Sto Return     | -233.87  |
| Running Env Steps   | 221760   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 176      |
----------------------------------
2024-05-11 06:20:37.334616 Eastern Daylight Time
| Itration            | 177      |
| Loss                | 10       |
| Real Det Return     | 340.97   |
| Real Sto Return     | -249.05  |
| Running Env Steps   | 223020   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 177      |
----------------------------------
2024-05-11 06:22:33.346852 Eastern Daylight Time
| Itration            | 178      |
| Loss                | 10       |
| Real Det Return     | 305.78   |
| Real Sto Return     | -271.93  |
| Running Env Steps   | 224280   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 178      |
----------------------------------
2024-05-11 06:24:29.903751 Eastern Daylight Time
| Itration            | 179      |
| Loss                | 10       |
| Real Det Return     | 212.14   |
| Real Sto Return     | -205.38  |
| Running Env Steps   | 225540   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 179      |
----------------------------------
2024-05-11 06:26:25.926290 Eastern Daylight Time
| Itration            | 180      |
| Loss                | 10       |
| Real Det Return     | 234.93   |
| Real Sto Return     | -267.75  |
| Running Env Steps   | 226800   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 180      |
----------------------------------
2024-05-11 06:28:22.501789 Eastern Daylight Time
| Itration            | 181      |
| Loss                | 10       |
| Real Det Return     | 285.96   |
| Real Sto Return     | -220.97  |
| Running Env Steps   | 228060   |
| Running Forward KL  | -57.2    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 181      |
----------------------------------
2024-05-11 06:30:18.888231 Eastern Daylight Time
| Itration            | 182      |
| Loss                | 10       |
| Real Det Return     | 258.73   |
| Real Sto Return     | -222.69  |
| Running Env Steps   | 229320   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 182      |
----------------------------------
2024-05-11 06:32:15.886952 Eastern Daylight Time
| Itration            | 183      |
| Loss                | 10       |
| Real Det Return     | 97.97    |
| Real Sto Return     | -284.29  |
| Running Env Steps   | 230580   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 183      |
----------------------------------
2024-05-11 06:34:15.431950 Eastern Daylight Time
| Itration            | 184      |
| Loss                | 10       |
| Real Det Return     | 153.73   |
| Real Sto Return     | -229.75  |
| Running Env Steps   | 231840   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 184      |
----------------------------------
2024-05-11 06:36:11.805724 Eastern Daylight Time
| Itration            | 185      |
| Loss                | 10       |
| Real Det Return     | 70.74    |
| Real Sto Return     | -285.74  |
| Running Env Steps   | 233100   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 185      |
----------------------------------
2024-05-11 06:38:10.918205 Eastern Daylight Time
| Itration            | 186      |
| Loss                | 10       |
| Real Det Return     | 306.63   |
| Real Sto Return     | -282.33  |
| Running Env Steps   | 234360   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 186      |
----------------------------------
2024-05-11 06:40:08.551576 Eastern Daylight Time
| Itration            | 187      |
| Loss                | 10       |
| Real Det Return     | 207.13   |
| Real Sto Return     | -151.37  |
| Running Env Steps   | 235620   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 187      |
----------------------------------
2024-05-11 06:42:06.267347 Eastern Daylight Time
| Itration            | 188      |
| Loss                | 10       |
| Real Det Return     | 153.1    |
| Real Sto Return     | -272.16  |
| Running Env Steps   | 236880   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 188      |
----------------------------------
2024-05-11 06:44:03.710097 Eastern Daylight Time
| Itration            | 189      |
| Loss                | 10       |
| Real Det Return     | 10.12    |
| Real Sto Return     | -272.64  |
| Running Env Steps   | 238140   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 189      |
----------------------------------
2024-05-11 06:46:01.405296 Eastern Daylight Time
| Itration            | 190      |
| Loss                | 10       |
| Real Det Return     | 161.37   |
| Real Sto Return     | -238.05  |
| Running Env Steps   | 239400   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 190      |
----------------------------------
2024-05-11 06:48:02.742110 Eastern Daylight Time
| Itration            | 191      |
| Loss                | 10       |
| Real Det Return     | 251.01   |
| Real Sto Return     | -245.18  |
| Running Env Steps   | 240660   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 191      |
----------------------------------
2024-05-11 06:50:01.132266 Eastern Daylight Time
| Itration            | 192      |
| Loss                | 10       |
| Real Det Return     | 179.49   |
| Real Sto Return     | -229.15  |
| Running Env Steps   | 241920   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 192      |
----------------------------------
2024-05-11 06:57:34.185925 Eastern Daylight Time
| Itration            | 193      |
| Loss                | 10       |
| Real Det Return     | 224.83   |
| Real Sto Return     | -270.74  |
| Running Env Steps   | 243180   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 193      |
----------------------------------
2024-05-11 06:59:52.070332 Eastern Daylight Time
| Itration            | 194      |
| Loss                | 10       |
| Real Det Return     | 299.86   |
| Real Sto Return     | -226.39  |
| Running Env Steps   | 244440   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 194      |
----------------------------------
2024-05-11 07:01:53.001970 Eastern Daylight Time
| Itration            | 195      |
| Loss                | 10       |
| Real Det Return     | 251.91   |
| Real Sto Return     | -213.58  |
| Running Env Steps   | 245700   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 195      |
----------------------------------
2024-05-11 07:03:53.647827 Eastern Daylight Time
| Itration            | 196      |
| Loss                | 10       |
| Real Det Return     | 198.39   |
| Real Sto Return     | -259.22  |
| Running Env Steps   | 246960   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 196      |
----------------------------------
2024-05-11 07:05:55.085627 Eastern Daylight Time
| Itration            | 197      |
| Loss                | 10       |
| Real Det Return     | 429.56   |
| Real Sto Return     | -272.55  |
| Running Env Steps   | 248220   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 197      |
----------------------------------
2024-05-11 07:07:58.936503 Eastern Daylight Time
| Itration            | 198      |
| Loss                | 10       |
| Real Det Return     | 94.32    |
| Real Sto Return     | -268.42  |
| Running Env Steps   | 249480   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 198      |
----------------------------------
2024-05-11 07:09:59.937654 Eastern Daylight Time
| Itration            | 199      |
| Loss                | 10       |
| Real Det Return     | 234.08   |
| Real Sto Return     | -262.46  |
| Running Env Steps   | 250740   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 199      |
----------------------------------
2024-05-11 07:12:07.504590 Eastern Daylight Time
| Itration            | 200      |
| Loss                | 10       |
| Real Det Return     | 389.61   |
| Real Sto Return     | -227.57  |
| Running Env Steps   | 252000   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 200      |
----------------------------------
2024-05-11 07:14:14.155375 Eastern Daylight Time
| Itration            | 201      |
| Loss                | 10       |
| Real Det Return     | 125.63   |
| Real Sto Return     | -250.27  |
| Running Env Steps   | 253260   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 201      |
----------------------------------
2024-05-11 07:16:21.053567 Eastern Daylight Time
| Itration            | 202      |
| Loss                | 10       |
| Real Det Return     | 215.03   |
| Real Sto Return     | -262.09  |
| Running Env Steps   | 254520   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 202      |
----------------------------------
2024-05-11 07:18:21.519268 Eastern Daylight Time
| Itration            | 203      |
| Loss                | 10       |
| Real Det Return     | 189.48   |
| Real Sto Return     | -201.93  |
| Running Env Steps   | 255780   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 203      |
----------------------------------
2024-05-11 07:20:23.564110 Eastern Daylight Time
| Itration            | 204      |
| Loss                | 10       |
| Real Det Return     | 71.15    |
| Real Sto Return     | -188.26  |
| Running Env Steps   | 257040   |
| Running Forward KL  | -57.3    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 204      |
----------------------------------
2024-05-11 07:22:24.893338 Eastern Daylight Time
| Itration            | 205      |
| Loss                | 10       |
| Real Det Return     | 162.81   |
| Real Sto Return     | -213.36  |
| Running Env Steps   | 258300   |
| Running Forward KL  | -57.3    |
| Running Reverse KL  | -58.2    |
| Running Update Time | 205      |
----------------------------------
2024-05-11 07:24:26.126225 Eastern Daylight Time
| Itration            | 206      |
| Loss                | 10       |
| Real Det Return     | 150.64   |
| Real Sto Return     | -305.0   |
| Running Env Steps   | 259560   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 206      |
----------------------------------
2024-05-11 07:26:28.225609 Eastern Daylight Time
| Itration            | 207      |
| Loss                | 10       |
| Real Det Return     | 189.69   |
| Real Sto Return     | -220.27  |
| Running Env Steps   | 260820   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 207      |
----------------------------------
2024-05-11 07:28:30.228435 Eastern Daylight Time
| Itration            | 208      |
| Loss                | 10       |
| Real Det Return     | 84.9     |
| Real Sto Return     | -228.73  |
| Running Env Steps   | 262080   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 208      |
----------------------------------
2024-05-11 07:30:41.977115 Eastern Daylight Time
| Itration            | 209      |
| Loss                | 10       |
| Real Det Return     | 299.69   |
| Real Sto Return     | -265.35  |
| Running Env Steps   | 263340   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 209      |
----------------------------------
2024-05-11 07:32:48.573133 Eastern Daylight Time
| Itration            | 210      |
| Loss                | 10       |
| Real Det Return     | 211.41   |
| Real Sto Return     | -221.2   |
| Running Env Steps   | 264600   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 210      |
----------------------------------
2024-05-11 07:34:55.797151 Eastern Daylight Time
| Itration            | 211      |
| Loss                | 10       |
| Real Det Return     | 248.35   |
| Real Sto Return     | -280.33  |
| Running Env Steps   | 265860   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 211      |
----------------------------------
2024-05-11 07:37:00.872524 Eastern Daylight Time
| Itration            | 212      |
| Loss                | 10       |
| Real Det Return     | 33.42    |
| Real Sto Return     | -209.71  |
| Running Env Steps   | 267120   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 212      |
----------------------------------
2024-05-11 07:39:11.347587 Eastern Daylight Time
| Itration            | 213      |
| Loss                | 10       |
| Real Det Return     | 179.81   |
| Real Sto Return     | -250.92  |
| Running Env Steps   | 268380   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 213      |
----------------------------------
2024-05-11 07:41:20.268768 Eastern Daylight Time
| Itration            | 214      |
| Loss                | 10       |
| Real Det Return     | 268.88   |
| Real Sto Return     | -280.92  |
| Running Env Steps   | 269640   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 214      |
----------------------------------
2024-05-11 07:50:36.706895 Eastern Daylight Time
| Itration            | 215      |
| Loss                | 10       |
| Real Det Return     | 222.17   |
| Real Sto Return     | -243.09  |
| Running Env Steps   | 270900   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 215      |
----------------------------------
2024-05-11 07:52:42.742434 Eastern Daylight Time
| Itration            | 216      |
| Loss                | 10       |
| Real Det Return     | 239.79   |
| Real Sto Return     | -279.95  |
| Running Env Steps   | 272160   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 216      |
----------------------------------
2024-05-11 07:54:53.042181 Eastern Daylight Time
| Itration            | 217      |
| Loss                | 10       |
| Real Det Return     | 95.97    |
| Real Sto Return     | -212.32  |
| Running Env Steps   | 273420   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 217      |
----------------------------------
2024-05-11 07:56:57.322868 Eastern Daylight Time
| Itration            | 218      |
| Loss                | 10       |
| Real Det Return     | 54.73    |
| Real Sto Return     | -244.52  |
| Running Env Steps   | 274680   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 218      |
----------------------------------
2024-05-11 07:59:02.687766 Eastern Daylight Time
| Itration            | 219      |
| Loss                | 10       |
| Real Det Return     | 122.43   |
| Real Sto Return     | -244.45  |
| Running Env Steps   | 275940   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 219      |
----------------------------------
2024-05-11 08:01:08.277820 Eastern Daylight Time
| Itration            | 220      |
| Loss                | 10       |
| Real Det Return     | 306.91   |
| Real Sto Return     | -242.4   |
| Running Env Steps   | 277200   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 220      |
----------------------------------
2024-05-11 08:03:21.390980 Eastern Daylight Time
| Itration            | 221      |
| Loss                | 10       |
| Real Det Return     | 244.03   |
| Real Sto Return     | -263.3   |
| Running Env Steps   | 278460   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 221      |
----------------------------------
2024-05-11 08:05:36.077940 Eastern Daylight Time
| Itration            | 222      |
| Loss                | 10       |
| Real Det Return     | 317.62   |
| Real Sto Return     | -255.63  |
| Running Env Steps   | 279720   |
| Running Forward KL  | -56.2    |
| Running Reverse KL  | -57.2    |
| Running Update Time | 222      |
----------------------------------
2024-05-11 08:07:32.398290 Eastern Daylight Time
| Itration            | 223      |
| Loss                | 10       |
| Real Det Return     | 223.3    |
| Real Sto Return     | -219.69  |
| Running Env Steps   | 280980   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 223      |
----------------------------------
2024-05-11 08:09:28.814816 Eastern Daylight Time
| Itration            | 224      |
| Loss                | 10       |
| Real Det Return     | 458.87   |
| Real Sto Return     | -223.98  |
| Running Env Steps   | 282240   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 224      |
----------------------------------
2024-05-11 08:11:27.638857 Eastern Daylight Time
| Itration            | 225      |
| Loss                | 10       |
| Real Det Return     | 216.87   |
| Real Sto Return     | -207.52  |
| Running Env Steps   | 283500   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 225      |
----------------------------------
2024-05-11 08:13:17.218656 Eastern Daylight Time
| Itration            | 226      |
| Loss                | 10       |
| Real Det Return     | 188.13   |
| Real Sto Return     | -258.41  |
| Running Env Steps   | 284760   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 226      |
----------------------------------
2024-05-11 08:15:14.209194 Eastern Daylight Time
| Itration            | 227      |
| Loss                | 10       |
| Real Det Return     | 64.87    |
| Real Sto Return     | -270.2   |
| Running Env Steps   | 286020   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 227      |
----------------------------------
2024-05-11 08:17:04.462282 Eastern Daylight Time
| Itration            | 228      |
| Loss                | 10       |
| Real Det Return     | 112.54   |
| Real Sto Return     | -244.63  |
| Running Env Steps   | 287280   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 228      |
----------------------------------
2024-05-11 08:18:58.308168 Eastern Daylight Time
| Itration            | 229      |
| Loss                | 10       |
| Real Det Return     | 207.46   |
| Real Sto Return     | -220.31  |
| Running Env Steps   | 288540   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 229      |
----------------------------------
2024-05-11 08:20:53.100434 Eastern Daylight Time
| Itration            | 230      |
| Loss                | 10       |
| Real Det Return     | 44.37    |
| Real Sto Return     | -207.86  |
| Running Env Steps   | 289800   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 230      |
----------------------------------
2024-05-11 08:22:43.911263 Eastern Daylight Time
| Itration            | 231      |
| Loss                | 10       |
| Real Det Return     | 66.2     |
| Real Sto Return     | -197.55  |
| Running Env Steps   | 291060   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 231      |
----------------------------------
2024-05-11 08:24:38.439958 Eastern Daylight Time
| Itration            | 232      |
| Loss                | 10       |
| Real Det Return     | 131.37   |
| Real Sto Return     | -246.75  |
| Running Env Steps   | 292320   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 232      |
----------------------------------
2024-05-11 08:26:30.057726 Eastern Daylight Time
| Itration            | 233      |
| Loss                | 10       |
| Real Det Return     | 44.52    |
| Real Sto Return     | -272.71  |
| Running Env Steps   | 293580   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 233      |
----------------------------------
2024-05-11 08:28:25.804861 Eastern Daylight Time
| Itration            | 234      |
| Loss                | 10       |
| Real Det Return     | 114.46   |
| Real Sto Return     | -211.1   |
| Running Env Steps   | 294840   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 234      |
----------------------------------
2024-05-11 08:30:17.479300 Eastern Daylight Time
| Itration            | 235      |
| Loss                | 10       |
| Real Det Return     | 71.2     |
| Real Sto Return     | -257.1   |
| Running Env Steps   | 296100   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 235      |
----------------------------------
2024-05-11 08:32:19.426838 Eastern Daylight Time
| Itration            | 236      |
| Loss                | 10       |
| Real Det Return     | 62.6     |
| Real Sto Return     | -212.53  |
| Running Env Steps   | 297360   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 236      |
----------------------------------
2024-05-11 08:34:11.338073 Eastern Daylight Time
| Itration            | 237      |
| Loss                | 10       |
| Real Det Return     | 252.16   |
| Real Sto Return     | -284.04  |
| Running Env Steps   | 298620   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 237      |
----------------------------------
2024-05-11 08:42:37.924975 Eastern Daylight Time
| Itration            | 238      |
| Loss                | 10       |
| Real Det Return     | 222.35   |
| Real Sto Return     | -288.68  |
| Running Env Steps   | 299880   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 238      |
----------------------------------
2024-05-11 08:44:59.523604 Eastern Daylight Time
| Itration            | 239      |
| Loss                | 10       |
| Real Det Return     | 67.02    |
| Real Sto Return     | -249.41  |
| Running Env Steps   | 301140   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 239      |
----------------------------------
2024-05-11 08:46:56.650362 Eastern Daylight Time
| Itration            | 240      |
| Loss                | 10       |
| Real Det Return     | 66.08    |
| Real Sto Return     | -225.11  |
| Running Env Steps   | 302400   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 240      |
----------------------------------
2024-05-11 08:49:06.999867 Eastern Daylight Time
| Itration            | 241      |
| Loss                | 10       |
| Real Det Return     | 399.23   |
| Real Sto Return     | -289.8   |
| Running Env Steps   | 303660   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 241      |
----------------------------------
2024-05-11 08:51:10.197845 Eastern Daylight Time
| Itration            | 242      |
| Loss                | 10       |
| Real Det Return     | -1.7     |
| Real Sto Return     | -238.24  |
| Running Env Steps   | 304920   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 242      |
----------------------------------
2024-05-11 08:53:07.134141 Eastern Daylight Time
| Itration            | 243      |
| Loss                | 10       |
| Real Det Return     | 163.5    |
| Real Sto Return     | -232.36  |
| Running Env Steps   | 306180   |
| Running Forward KL  | -55.9    |
| Running Reverse KL  | -56.9    |
| Running Update Time | 243      |
----------------------------------
2024-05-11 08:55:04.318356 Eastern Daylight Time
| Itration            | 244      |
| Loss                | 10       |
| Real Det Return     | 242.51   |
| Real Sto Return     | -256.51  |
| Running Env Steps   | 307440   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 244      |
----------------------------------
2024-05-11 08:57:01.441412 Eastern Daylight Time
| Itration            | 245      |
| Loss                | 10       |
| Real Det Return     | 265.08   |
| Real Sto Return     | -265.14  |
| Running Env Steps   | 308700   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 245      |
----------------------------------
2024-05-11 08:58:59.146930 Eastern Daylight Time
| Itration            | 246      |
| Loss                | 10       |
| Real Det Return     | 309.61   |
| Real Sto Return     | -208.62  |
| Running Env Steps   | 309960   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 246      |
----------------------------------
2024-05-11 09:00:59.318862 Eastern Daylight Time
| Itration            | 247      |
| Loss                | 10       |
| Real Det Return     | 115.04   |
| Real Sto Return     | -240.05  |
| Running Env Steps   | 311220   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 247      |
----------------------------------
2024-05-11 09:03:01.108956 Eastern Daylight Time
| Itration            | 248      |
| Loss                | 10       |
| Real Det Return     | 279.43   |
| Real Sto Return     | -253.97  |
| Running Env Steps   | 312480   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 248      |
----------------------------------
2024-05-11 09:04:59.379306 Eastern Daylight Time
| Itration            | 249      |
| Loss                | 10       |
| Real Det Return     | 134.62   |
| Real Sto Return     | -268.22  |
| Running Env Steps   | 313740   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 249      |
----------------------------------
2024-05-11 09:07:01.180547 Eastern Daylight Time
| Itration            | 250      |
| Loss                | 10       |
| Real Det Return     | 106.07   |
| Real Sto Return     | -239.08  |
| Running Env Steps   | 315000   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 250      |
----------------------------------
2024-05-11 09:08:59.509054 Eastern Daylight Time
| Itration            | 251      |
| Loss                | 10       |
| Real Det Return     | 231.58   |
| Real Sto Return     | -239.04  |
| Running Env Steps   | 316260   |
| Running Forward KL  | -57.6    |
| Running Reverse KL  | -57.5    |
| Running Update Time | 251      |
----------------------------------
