Logging to logs/HalfCheetahFH-v0/exp-16/fkl/2024_08_11_05_56_06
--2024-08-11 05:57:31.123914 UTC--
| Itration            | 0        |
| Real Det Return     | -19.8    |
| Real Sto Return     | -167     |
| Reward Loss         | 2.54e+06 |
| Running Env Steps   | 0        |
| Running Forward KL  | 31.3     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 0        |
----------------------------------
--2024-08-11 05:58:40.045575 UTC--
| Itration            | 1        |
| Real Det Return     | -38.1    |
| Real Sto Return     | -145     |
| Reward Loss         | 2.74e+06 |
| Running Env Steps   | 5000     |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 11       |
| Running Update Time | 1        |
----------------------------------
--2024-08-11 05:59:44.813376 UTC--
| Itration            | 2        |
| Real Det Return     | -3.87    |
| Real Sto Return     | -124     |
| Reward Loss         | 2.73e+06 |
| Running Env Steps   | 10000    |
| Running Forward KL  | 32       |
| Running Reverse KL  | 12.2     |
| Running Update Time | 2        |
----------------------------------
--2024-08-11 06:00:48.151711 UTC--
| Itration            | 3        |
| Real Det Return     | 1.38     |
| Real Sto Return     | -82.7    |
| Reward Loss         | 2.61e+06 |
| Running Env Steps   | 15000    |
| Running Forward KL  | 32       |
| Running Reverse KL  | 12.3     |
| Running Update Time | 3        |
----------------------------------
--2024-08-11 06:01:50.593119 UTC--
| Itration            | 4        |
| Real Det Return     | 0.98     |
| Real Sto Return     | -69      |
| Reward Loss         | 2.61e+06 |
| Running Env Steps   | 20000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 4        |
----------------------------------
--2024-08-11 06:02:52.753021 UTC--
| Itration            | 5        |
| Real Det Return     | -0.03    |
| Real Sto Return     | -68.7    |
| Reward Loss         | 2.32e+06 |
| Running Env Steps   | 25000    |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 5        |
----------------------------------
--2024-08-11 06:04:24.495001 UTC--
| Itration            | 6        |
| Real Det Return     | 0.82     |
| Real Sto Return     | -56.4    |
| Reward Loss         | 2.27e+06 |
| Running Env Steps   | 30000    |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 6        |
----------------------------------
--2024-08-11 06:05:55.849796 UTC--
| Itration            | 7        |
| Real Det Return     | 0.79     |
| Real Sto Return     | -45.6    |
| Reward Loss         | 1.98e+06 |
| Running Env Steps   | 35000    |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 7        |
----------------------------------
--2024-08-11 06:07:26.547784 UTC--
| Itration            | 8        |
| Real Det Return     | 2.03     |
| Real Sto Return     | -30.3    |
| Reward Loss         | 1.79e+06 |
| Running Env Steps   | 40000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 8        |
----------------------------------
--2024-08-11 06:09:00.442664 UTC--
| Itration            | 9        |
| Real Det Return     | 0.16     |
| Real Sto Return     | -35.3    |
| Reward Loss         | 1.62e+06 |
| Running Env Steps   | 45000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 13       |
| Running Update Time | 9        |
----------------------------------
--2024-08-11 06:10:31.896956 UTC--
| Itration            | 10       |
| Real Det Return     | 0.17     |
| Real Sto Return     | -41.2    |
| Reward Loss         | 1.41e+06 |
| Running Env Steps   | 50000    |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 10       |
----------------------------------
--2024-08-11 06:12:07.198654 UTC--
| Itration            | 11       |
| Real Det Return     | 1.8      |
| Real Sto Return     | -38.5    |
| Reward Loss         | 1.23e+06 |
| Running Env Steps   | 55000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 13       |
| Running Update Time | 11       |
----------------------------------
--2024-08-11 06:13:38.063670 UTC--
| Itration            | 12       |
| Real Det Return     | 2.79     |
| Real Sto Return     | -31.8    |
| Reward Loss         | 1.12e+06 |
| Running Env Steps   | 60000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 13       |
| Running Update Time | 12       |
----------------------------------
--2024-08-11 06:15:11.459549 UTC--
| Itration            | 13       |
| Real Det Return     | 2.3      |
| Real Sto Return     | -42.6    |
| Reward Loss         | 8.85e+05 |
| Running Env Steps   | 65000    |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 12.5     |
| Running Update Time | 13       |
----------------------------------
--2024-08-11 06:16:47.621861 UTC--
| Itration            | 14       |
| Real Det Return     | 4.28     |
| Real Sto Return     | -40.8    |
| Reward Loss         | 7.61e+05 |
| Running Env Steps   | 70000    |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 12.9     |
| Running Update Time | 14       |
----------------------------------
--2024-08-11 06:18:19.574885 UTC--
| Itration            | 15       |
| Real Det Return     | 3.4      |
| Real Sto Return     | -42.1    |
| Reward Loss         | 5.09e+05 |
| Running Env Steps   | 75000    |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 12.8     |
| Running Update Time | 15       |
----------------------------------
--2024-08-11 06:19:52.615463 UTC--
| Itration            | 16       |
| Real Det Return     | 3.34     |
| Real Sto Return     | -20.7    |
| Reward Loss         | 3.47e+05 |
| Running Env Steps   | 80000    |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 16       |
----------------------------------
--2024-08-11 06:21:26.893638 UTC--
| Itration            | 17       |
| Real Det Return     | 6.08     |
| Real Sto Return     | -36.6    |
| Reward Loss         | 1.69e+05 |
| Running Env Steps   | 85000    |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 12.7     |
| Running Update Time | 17       |
----------------------------------
--2024-08-11 06:22:59.184636 UTC---
| Itration            | 18        |
| Real Det Return     | 3.54      |
| Real Sto Return     | -33       |
| Reward Loss         | -3.58e+03 |
| Running Env Steps   | 90000     |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 12.9      |
| Running Update Time | 18        |
-----------------------------------
--2024-08-11 06:24:33.415254 UTC---
| Itration            | 19        |
| Real Det Return     | 3.77      |
| Real Sto Return     | -24.2     |
| Reward Loss         | -1.93e+05 |
| Running Env Steps   | 95000     |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 13        |
| Running Update Time | 19        |
-----------------------------------
--2024-08-11 06:26:04.319008 UTC---
| Itration            | 20        |
| Real Det Return     | 5.17      |
| Real Sto Return     | -27.5     |
| Reward Loss         | -3.53e+05 |
| Running Env Steps   | 100000    |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 12.5      |
| Running Update Time | 20        |
-----------------------------------
--2024-08-11 06:27:37.042413 UTC---
| Itration            | 21        |
| Real Det Return     | 5.34      |
| Real Sto Return     | -40.6     |
| Reward Loss         | -5.08e+05 |
| Running Env Steps   | 105000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.8      |
| Running Update Time | 21        |
-----------------------------------
--2024-08-11 06:29:11.638350 UTC---
| Itration            | 22        |
| Real Det Return     | 5.18      |
| Real Sto Return     | -23.2     |
| Reward Loss         | -6.96e+05 |
| Running Env Steps   | 110000    |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 12.5      |
| Running Update Time | 22        |
-----------------------------------
--2024-08-11 06:30:43.727700 UTC---
| Itration            | 23        |
| Real Det Return     | 4.72      |
| Real Sto Return     | -31       |
| Reward Loss         | -8.91e+05 |
| Running Env Steps   | 115000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 23        |
-----------------------------------
--2024-08-11 06:32:16.977714 UTC---
| Itration            | 24        |
| Real Det Return     | 4.42      |
| Real Sto Return     | -30       |
| Reward Loss         | -1.05e+06 |
| Running Env Steps   | 120000    |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 13        |
| Running Update Time | 24        |
-----------------------------------
--2024-08-11 06:33:49.752243 UTC---
| Itration            | 25        |
| Real Det Return     | 5.71      |
| Real Sto Return     | -37.5     |
| Reward Loss         | -1.23e+06 |
| Running Env Steps   | 125000    |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 25        |
-----------------------------------
--2024-08-11 06:35:22.889971 UTC---
| Itration            | 26        |
| Real Det Return     | 4.95      |
| Real Sto Return     | -35.6     |
| Reward Loss         | -1.38e+06 |
| Running Env Steps   | 130000    |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 12.3      |
| Running Update Time | 26        |
-----------------------------------
--2024-08-11 06:36:56.380107 UTC---
| Itration            | 27        |
| Real Det Return     | 5.51      |
| Real Sto Return     | -23.3     |
| Reward Loss         | -1.63e+06 |
| Running Env Steps   | 135000    |
| Running Forward KL  | 32.2      |
| Running Reverse KL  | 12.6      |
| Running Update Time | 27        |
-----------------------------------
--2024-08-11 06:38:28.313110 UTC---
| Itration            | 28        |
| Real Det Return     | 4.74      |
| Real Sto Return     | -23       |
| Reward Loss         | -1.76e+06 |
| Running Env Steps   | 140000    |
| Running Forward KL  | 32        |
| Running Reverse KL  | 12.3      |
| Running Update Time | 28        |
-----------------------------------
--2024-08-11 06:40:01.310729 UTC---
| Itration            | 29        |
| Real Det Return     | 4.66      |
| Real Sto Return     | -20.5     |
| Reward Loss         | -1.91e+06 |
| Running Env Steps   | 145000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.8      |
| Running Update Time | 29        |
-----------------------------------
--2024-08-11 06:41:33.025493 UTC---
| Itration            | 30        |
| Real Det Return     | 6.12      |
| Real Sto Return     | -17.1     |
| Reward Loss         | -2.08e+06 |
| Running Env Steps   | 150000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 30        |
-----------------------------------
--2024-08-11 06:43:06.044796 UTC---
| Itration            | 31        |
| Real Det Return     | 5.17      |
| Real Sto Return     | -27.5     |
| Reward Loss         | -2.25e+06 |
| Running Env Steps   | 155000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 31        |
-----------------------------------
--2024-08-11 06:44:40.088328 UTC---
| Itration            | 32        |
| Real Det Return     | 6.28      |
| Real Sto Return     | -36.1     |
| Reward Loss         | -2.45e+06 |
| Running Env Steps   | 160000    |
| Running Forward KL  | 32.2      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 32        |
-----------------------------------
--2024-08-11 06:46:12.953451 UTC---
| Itration            | 33        |
| Real Det Return     | 5.28      |
| Real Sto Return     | -11.1     |
| Reward Loss         | -2.64e+06 |
| Running Env Steps   | 165000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 33        |
-----------------------------------
--2024-08-11 06:47:46.329213 UTC--
| Itration            | 34       |
| Real Det Return     | 4.14     |
| Real Sto Return     | -12.4    |
| Reward Loss         | -2.8e+06 |
| Running Env Steps   | 170000   |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 12.6     |
| Running Update Time | 34       |
----------------------------------
--2024-08-11 06:49:21.144521 UTC---
| Itration            | 35        |
| Real Det Return     | 5.35      |
| Real Sto Return     | -19.8     |
| Reward Loss         | -3.01e+06 |
| Running Env Steps   | 175000    |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 12.7      |
| Running Update Time | 35        |
-----------------------------------
--2024-08-11 06:50:53.169112 UTC---
| Itration            | 36        |
| Real Det Return     | 6.12      |
| Real Sto Return     | -14.4     |
| Reward Loss         | -3.19e+06 |
| Running Env Steps   | 180000    |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 12.5      |
| Running Update Time | 36        |
-----------------------------------
--2024-08-11 06:52:26.625214 UTC---
| Itration            | 37        |
| Real Det Return     | 5.49      |
| Real Sto Return     | -15.7     |
| Reward Loss         | -3.28e+06 |
| Running Env Steps   | 185000    |
| Running Forward KL  | 32        |
| Running Reverse KL  | 12.3      |
| Running Update Time | 37        |
-----------------------------------
--2024-08-11 06:53:59.099737 UTC--
| Itration            | 38       |
| Real Det Return     | 5.13     |
| Real Sto Return     | -17.9    |
| Reward Loss         | -3.6e+06 |
| Running Env Steps   | 190000   |
| Running Forward KL  | 32       |
| Running Reverse KL  | 12.3     |
| Running Update Time | 38       |
----------------------------------
--2024-08-11 06:55:32.669569 UTC---
| Itration            | 39        |
| Real Det Return     | 6.46      |
| Real Sto Return     | -2.84     |
| Reward Loss         | -3.75e+06 |
| Running Env Steps   | 195000    |
| Running Forward KL  | 32.2      |
| Running Reverse KL  | 12.6      |
| Running Update Time | 39        |
-----------------------------------
--2024-08-11 06:57:07.900183 UTC---
| Itration            | 40        |
| Real Det Return     | 4.79      |
| Real Sto Return     | -25.2     |
| Reward Loss         | -3.84e+06 |
| Running Env Steps   | 200000    |
| Running Forward KL  | 32        |
| Running Reverse KL  | 12.2      |
| Running Update Time | 40        |
-----------------------------------
--2024-08-11 06:58:41.039842 UTC---
| Itration            | 41        |
| Real Det Return     | 5.67      |
| Real Sto Return     | -6.76     |
| Reward Loss         | -3.99e+06 |
| Running Env Steps   | 205000    |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 12.4      |
| Running Update Time | 41        |
-----------------------------------
--2024-08-11 07:00:13.761292 UTC--
| Itration            | 42       |
| Real Det Return     | 6.83     |
| Real Sto Return     | -30.6    |
| Reward Loss         | -4.2e+06 |
| Running Env Steps   | 210000   |
| Running Forward KL  | 31.8     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 42       |
----------------------------------
--2024-08-11 07:01:46.188531 UTC---
| Itration            | 43        |
| Real Det Return     | 5.85      |
| Real Sto Return     | -19.2     |
| Reward Loss         | -4.35e+06 |
| Running Env Steps   | 215000    |
| Running Forward KL  | 32        |
| Running Reverse KL  | 12.4      |
| Running Update Time | 43        |
-----------------------------------
--2024-08-11 07:03:18.497769 UTC---
| Itration            | 44        |
| Real Det Return     | 6.23      |
| Real Sto Return     | -13.5     |
| Reward Loss         | -4.54e+06 |
| Running Env Steps   | 220000    |
| Running Forward KL  | 32        |
| Running Reverse KL  | 12        |
| Running Update Time | 44        |
-----------------------------------
--2024-08-11 07:04:52.712226 UTC--
| Itration            | 45       |
| Real Det Return     | 5.97     |
| Real Sto Return     | -13.2    |
| Reward Loss         | -4.8e+06 |
| Running Env Steps   | 225000   |
| Running Forward KL  | 31.8     |
| Running Reverse KL  | 12       |
| Running Update Time | 45       |
----------------------------------
--2024-08-11 07:06:24.649280 UTC---
| Itration            | 46        |
| Real Det Return     | 7.27      |
| Real Sto Return     | -16.4     |
| Reward Loss         | -4.91e+06 |
| Running Env Steps   | 230000    |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 12.1      |
| Running Update Time | 46        |
-----------------------------------
--2024-08-11 07:07:58.486371 UTC---
| Itration            | 47        |
| Real Det Return     | 6.07      |
| Real Sto Return     | 1.38      |
| Reward Loss         | -5.06e+06 |
| Running Env Steps   | 235000    |
| Running Forward KL  | 31.6      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 47        |
-----------------------------------
--2024-08-11 07:09:33.709497 UTC---
| Itration            | 48        |
| Real Det Return     | 6.16      |
| Real Sto Return     | -14.9     |
| Reward Loss         | -5.39e+06 |
| Running Env Steps   | 240000    |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 12        |
| Running Update Time | 48        |
-----------------------------------
--2024-08-11 07:11:05.641713 UTC---
| Itration            | 49        |
| Real Det Return     | 6.99      |
| Real Sto Return     | -22.2     |
| Reward Loss         | -5.41e+06 |
| Running Env Steps   | 245000    |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 12        |
| Running Update Time | 49        |
-----------------------------------
--2024-08-11 07:12:39.435393 UTC--
| Itration            | 50       |
| Real Det Return     | 5.6      |
| Real Sto Return     | -17.3    |
| Reward Loss         | -5.6e+06 |
| Running Env Steps   | 250000   |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 50       |
----------------------------------
--2024-08-11 07:14:12.909356 UTC---
| Itration            | 51        |
| Real Det Return     | 6.57      |
| Real Sto Return     | -6.77     |
| Reward Loss         | -5.69e+06 |
| Running Env Steps   | 255000    |
| Running Forward KL  | 31.6      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 51        |
-----------------------------------
--2024-08-11 07:15:47.798729 UTC--
| Itration            | 52       |
| Real Det Return     | 5.65     |
| Real Sto Return     | -8.63    |
| Reward Loss         | -5.9e+06 |
| Running Env Steps   | 260000   |
| Running Forward KL  | 31.6     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 52       |
----------------------------------
--2024-08-11 07:17:22.551429 UTC---
| Itration            | 53        |
| Real Det Return     | 6.45      |
| Real Sto Return     | -10.8     |
| Reward Loss         | -6.03e+06 |
| Running Env Steps   | 265000    |
| Running Forward KL  | 31.5      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 53        |
-----------------------------------
--2024-08-11 07:18:55.616813 UTC---
| Itration            | 54        |
| Real Det Return     | 5.88      |
| Real Sto Return     | -28.3     |
| Reward Loss         | -6.45e+06 |
| Running Env Steps   | 270000    |
| Running Forward KL  | 31.6      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 54        |
-----------------------------------
--2024-08-11 07:20:27.998251 UTC---
| Itration            | 55        |
| Real Det Return     | 6.52      |
| Real Sto Return     | -12.4     |
| Reward Loss         | -6.43e+06 |
| Running Env Steps   | 275000    |
| Running Forward KL  | 31.4      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 55        |
-----------------------------------
--2024-08-11 07:22:01.805723 UTC--
| Itration            | 56       |
| Real Det Return     | 5.27     |
| Real Sto Return     | -45.1    |
| Reward Loss         | -6.8e+06 |
| Running Env Steps   | 280000   |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 56       |
----------------------------------
--2024-08-11 07:23:34.361739 UTC---
| Itration            | 57        |
| Real Det Return     | 7.13      |
| Real Sto Return     | -56.5     |
| Reward Loss         | -6.94e+06 |
| Running Env Steps   | 285000    |
| Running Forward KL  | 31.3      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 57        |
-----------------------------------
--2024-08-11 07:25:09.156210 UTC---
| Itration            | 58        |
| Real Det Return     | 6.48      |
| Real Sto Return     | -27.1     |
| Reward Loss         | -6.87e+06 |
| Running Env Steps   | 290000    |
| Running Forward KL  | 31        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 58        |
-----------------------------------
--2024-08-11 07:26:40.720863 UTC---
| Itration            | 59        |
| Real Det Return     | 7.25      |
| Real Sto Return     | -19.9     |
| Reward Loss         | -7.29e+06 |
| Running Env Steps   | 295000    |
| Running Forward KL  | 31.2      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 59        |
-----------------------------------
--2024-08-11 07:28:14.592569 UTC---
| Itration            | 60        |
| Real Det Return     | 5.73      |
| Real Sto Return     | -2.01     |
| Reward Loss         | -7.24e+06 |
| Running Env Steps   | 300000    |
| Running Forward KL  | 31        |
| Running Reverse KL  | 11.2      |
| Running Update Time | 60        |
-----------------------------------
--2024-08-11 07:29:49.228737 UTC--
| Itration            | 61       |
| Real Det Return     | 5.83     |
| Real Sto Return     | -65.3    |
| Reward Loss         | -7.4e+06 |
| Running Env Steps   | 305000   |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 61       |
----------------------------------
--2024-08-11 07:31:21.515127 UTC---
| Itration            | 62        |
| Real Det Return     | 4.34      |
| Real Sto Return     | -45.7     |
| Reward Loss         | -7.36e+06 |
| Running Env Steps   | 310000    |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 9.63      |
| Running Update Time | 62        |
-----------------------------------
--2024-08-11 07:32:54.129811 UTC---
| Itration            | 63        |
| Real Det Return     | 6.18      |
| Real Sto Return     | -1.15     |
| Reward Loss         | -7.48e+06 |
| Running Env Steps   | 315000    |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 63        |
-----------------------------------
--2024-08-11 07:34:27.708194 UTC--
| Itration            | 64       |
| Real Det Return     | 7.55     |
| Real Sto Return     | -16      |
| Reward Loss         | -7.5e+06 |
| Running Env Steps   | 320000   |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 64       |
----------------------------------
--2024-08-11 07:36:00.472689 UTC---
| Itration            | 65        |
| Real Det Return     | 6.17      |
| Real Sto Return     | -52.9     |
| Reward Loss         | -7.78e+06 |
| Running Env Steps   | 325000    |
| Running Forward KL  | 30.3      |
| Running Reverse KL  | 9.92      |
| Running Update Time | 65        |
-----------------------------------
--2024-08-11 07:37:35.841138 UTC---
| Itration            | 66        |
| Real Det Return     | 5.79      |
| Real Sto Return     | -13.6     |
| Reward Loss         | -7.23e+06 |
| Running Env Steps   | 330000    |
| Running Forward KL  | 30        |
| Running Reverse KL  | 9.73      |
| Running Update Time | 66        |
-----------------------------------
--2024-08-11 07:39:09.124446 UTC---
| Itration            | 67        |
| Real Det Return     | 5.22      |
| Real Sto Return     | -15.3     |
| Reward Loss         | -6.95e+06 |
| Running Env Steps   | 335000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 9.84      |
| Running Update Time | 67        |
-----------------------------------
--2024-08-11 07:40:43.719706 UTC---
| Itration            | 68        |
| Real Det Return     | 7.2       |
| Real Sto Return     | -32.6     |
| Reward Loss         | -7.46e+06 |
| Running Env Steps   | 340000    |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.62      |
| Running Update Time | 68        |
-----------------------------------
--2024-08-11 07:42:19.158335 UTC---
| Itration            | 69        |
| Real Det Return     | 6.9       |
| Real Sto Return     | -38.6     |
| Reward Loss         | -7.58e+06 |
| Running Env Steps   | 345000    |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.78      |
| Running Update Time | 69        |
-----------------------------------
--2024-08-11 07:43:51.271460 UTC---
| Itration            | 70        |
| Real Det Return     | 30.4      |
| Real Sto Return     | -91.7     |
| Reward Loss         | -7.01e+06 |
| Running Env Steps   | 350000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 70        |
-----------------------------------
--2024-08-11 07:45:26.211665 UTC---
| Itration            | 71        |
| Real Det Return     | -8.46     |
| Real Sto Return     | -14.7     |
| Reward Loss         | -9.48e+06 |
| Running Env Steps   | 355000    |
| Running Forward KL  | 32.5      |
| Running Reverse KL  | 13.2      |
| Running Update Time | 71        |
-----------------------------------
--2024-08-11 07:46:59.699740 UTC--
| Itration            | 72       |
| Real Det Return     | 4.65     |
| Real Sto Return     | -8.31    |
| Reward Loss         | -7.7e+06 |
| Running Env Steps   | 360000   |
| Running Forward KL  | 30       |
| Running Reverse KL  | 9.86     |
| Running Update Time | 72       |
----------------------------------
--2024-08-11 07:48:32.533678 UTC---
| Itration            | 73        |
| Real Det Return     | 128       |
| Real Sto Return     | -62.4     |
| Reward Loss         | -7.25e+06 |
| Running Env Steps   | 365000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 73        |
-----------------------------------
--2024-08-11 07:50:07.002698 UTC---
| Itration            | 74        |
| Real Det Return     | 159       |
| Real Sto Return     | -46.6     |
| Reward Loss         | -7.45e+06 |
| Running Env Steps   | 370000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 74        |
-----------------------------------
--2024-08-11 07:51:39.343153 UTC---
| Itration            | 75        |
| Real Det Return     | 154       |
| Real Sto Return     | -19.7     |
| Reward Loss         | -7.26e+06 |
| Running Env Steps   | 375000    |
| Running Forward KL  | 30        |
| Running Reverse KL  | 10.8      |
| Running Update Time | 75        |
-----------------------------------
--2024-08-11 07:53:12.349754 UTC---
| Itration            | 76        |
| Real Det Return     | 180       |
| Real Sto Return     | -48.6     |
| Reward Loss         | -7.94e+06 |
| Running Env Steps   | 380000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 76        |
-----------------------------------
--2024-08-11 07:54:46.702401 UTC---
| Itration            | 77        |
| Real Det Return     | 223       |
| Real Sto Return     | -3.67     |
| Reward Loss         | -7.61e+06 |
| Running Env Steps   | 385000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 77        |
-----------------------------------
--2024-08-11 07:56:19.114886 UTC---
| Itration            | 78        |
| Real Det Return     | 189       |
| Real Sto Return     | -18.4     |
| Reward Loss         | -7.62e+06 |
| Running Env Steps   | 390000    |
| Running Forward KL  | 30        |
| Running Reverse KL  | 10.8      |
| Running Update Time | 78        |
-----------------------------------
--2024-08-11 07:57:52.818774 UTC---
| Itration            | 79        |
| Real Det Return     | 234       |
| Real Sto Return     | -7.83     |
| Reward Loss         | -7.79e+06 |
| Running Env Steps   | 395000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 79        |
-----------------------------------
--2024-08-11 07:59:25.515250 UTC---
| Itration            | 80        |
| Real Det Return     | 214       |
| Real Sto Return     | -15.4     |
| Reward Loss         | -8.34e+06 |
| Running Env Steps   | 400000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 80        |
-----------------------------------
--2024-08-11 08:01:00.807734 UTC---
| Itration            | 81        |
| Real Det Return     | 251       |
| Real Sto Return     | 3.96      |
| Reward Loss         | -8.07e+06 |
| Running Env Steps   | 405000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 81        |
-----------------------------------
--2024-08-11 08:02:36.228282 UTC---
| Itration            | 82        |
| Real Det Return     | 262       |
| Real Sto Return     | 26        |
| Reward Loss         | -8.55e+06 |
| Running Env Steps   | 410000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 82        |
-----------------------------------
--2024-08-11 08:04:10.903345 UTC---
| Itration            | 83        |
| Real Det Return     | 269       |
| Real Sto Return     | 16.6      |
| Reward Loss         | -8.32e+06 |
| Running Env Steps   | 415000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 83        |
-----------------------------------
--2024-08-11 08:05:44.653472 UTC---
| Itration            | 84        |
| Real Det Return     | 214       |
| Real Sto Return     | -14       |
| Reward Loss         | -8.42e+06 |
| Running Env Steps   | 420000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 84        |
-----------------------------------
--2024-08-11 08:07:18.561886 UTC---
| Itration            | 85        |
| Real Det Return     | 289       |
| Real Sto Return     | 20.1      |
| Reward Loss         | -8.64e+06 |
| Running Env Steps   | 425000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 85        |
-----------------------------------
--2024-08-11 08:08:51.646578 UTC---
| Itration            | 86        |
| Real Det Return     | 243       |
| Real Sto Return     | 4.88      |
| Reward Loss         | -8.83e+06 |
| Running Env Steps   | 430000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 86        |
-----------------------------------
--2024-08-11 08:10:26.099964 UTC---
| Itration            | 87        |
| Real Det Return     | 231       |
| Real Sto Return     | 1.51      |
| Reward Loss         | -8.93e+06 |
| Running Env Steps   | 435000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 87        |
-----------------------------------
--2024-08-11 08:11:59.245823 UTC---
| Itration            | 88        |
| Real Det Return     | 242       |
| Real Sto Return     | -11.2     |
| Reward Loss         | -9.01e+06 |
| Running Env Steps   | 440000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 88        |
-----------------------------------
--2024-08-11 08:13:33.540243 UTC---
| Itration            | 89        |
| Real Det Return     | 238       |
| Real Sto Return     | -6.91     |
| Reward Loss         | -9.53e+06 |
| Running Env Steps   | 445000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 89        |
-----------------------------------
--2024-08-11 08:15:09.879689 UTC---
| Itration            | 90        |
| Real Det Return     | 226       |
| Real Sto Return     | 0.04      |
| Reward Loss         | -9.51e+06 |
| Running Env Steps   | 450000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 90        |
-----------------------------------
--2024-08-11 08:16:42.478875 UTC---
| Itration            | 91        |
| Real Det Return     | 247       |
| Real Sto Return     | 5.96      |
| Reward Loss         | -9.76e+06 |
| Running Env Steps   | 455000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 91        |
-----------------------------------
--2024-08-11 08:18:16.046301 UTC---
| Itration            | 92        |
| Real Det Return     | 267       |
| Real Sto Return     | 12        |
| Reward Loss         | -9.63e+06 |
| Running Env Steps   | 460000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 92        |
-----------------------------------
--2024-08-11 08:19:52.034364 UTC--
| Itration            | 93       |
| Real Det Return     | 260      |
| Real Sto Return     | 11.8     |
| Reward Loss         | -1e+07   |
| Running Env Steps   | 465000   |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 93       |
----------------------------------
--2024-08-11 08:21:25.435956 UTC--
| Itration            | 94       |
| Real Det Return     | 250      |
| Real Sto Return     | 2.54     |
| Reward Loss         | -9.9e+06 |
| Running Env Steps   | 470000   |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 94       |
----------------------------------
--2024-08-11 08:23:00.364357 UTC---
| Itration            | 95        |
| Real Det Return     | 260       |
| Real Sto Return     | 15.5      |
| Reward Loss         | -1.04e+07 |
| Running Env Steps   | 475000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 95        |
-----------------------------------
--2024-08-11 08:24:35.080052 UTC---
| Itration            | 96        |
| Real Det Return     | 251       |
| Real Sto Return     | 1.38      |
| Reward Loss         | -1.02e+07 |
| Running Env Steps   | 480000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 96        |
-----------------------------------
--2024-08-11 08:26:09.844378 UTC---
| Itration            | 97        |
| Real Det Return     | 249       |
| Real Sto Return     | 1         |
| Reward Loss         | -1.02e+07 |
| Running Env Steps   | 485000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 97        |
-----------------------------------
--2024-08-11 08:27:45.967597 UTC---
| Itration            | 98        |
| Real Det Return     | 237       |
| Real Sto Return     | -6.64     |
| Reward Loss         | -1.04e+07 |
| Running Env Steps   | 490000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 98        |
-----------------------------------
--2024-08-11 08:29:19.139050 UTC---
| Itration            | 99        |
| Real Det Return     | 240       |
| Real Sto Return     | -1.36     |
| Reward Loss         | -1.05e+07 |
| Running Env Steps   | 495000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 99        |
-----------------------------------
--2024-08-11 08:30:54.518347 UTC---
| Itration            | 100       |
| Real Det Return     | 247       |
| Real Sto Return     | -1.55     |
| Reward Loss         | -1.11e+07 |
| Running Env Steps   | 500000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 100       |
-----------------------------------
--2024-08-11 08:32:30.681141 UTC---
| Itration            | 101       |
| Real Det Return     | 250       |
| Real Sto Return     | 17.6      |
| Reward Loss         | -1.11e+07 |
| Running Env Steps   | 505000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 101       |
-----------------------------------
--2024-08-11 08:34:03.903728 UTC---
| Itration            | 102       |
| Real Det Return     | 255       |
| Real Sto Return     | 9.04      |
| Reward Loss         | -1.13e+07 |
| Running Env Steps   | 510000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 102       |
-----------------------------------
--2024-08-11 08:35:38.950300 UTC---
| Itration            | 103       |
| Real Det Return     | 270       |
| Real Sto Return     | -0.86     |
| Reward Loss         | -1.16e+07 |
| Running Env Steps   | 515000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 103       |
-----------------------------------
--2024-08-11 08:37:13.184857 UTC---
| Itration            | 104       |
| Real Det Return     | 276       |
| Real Sto Return     | 18.8      |
| Reward Loss         | -1.12e+07 |
| Running Env Steps   | 520000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 104       |
-----------------------------------
--2024-08-11 08:38:47.103396 UTC---
| Itration            | 105       |
| Real Det Return     | 247       |
| Real Sto Return     | 8.91      |
| Reward Loss         | -1.15e+07 |
| Running Env Steps   | 525000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 105       |
-----------------------------------
--2024-08-11 08:40:22.970969 UTC---
| Itration            | 106       |
| Real Det Return     | 238       |
| Real Sto Return     | -9.96     |
| Reward Loss         | -1.18e+07 |
| Running Env Steps   | 530000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 106       |
-----------------------------------
--2024-08-11 08:41:56.820523 UTC---
| Itration            | 107       |
| Real Det Return     | 221       |
| Real Sto Return     | 5.55      |
| Reward Loss         | -1.18e+07 |
| Running Env Steps   | 535000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 107       |
-----------------------------------
--2024-08-11 08:43:30.249265 UTC---
| Itration            | 108       |
| Real Det Return     | 267       |
| Real Sto Return     | 5.87      |
| Reward Loss         | -1.22e+07 |
| Running Env Steps   | 540000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 108       |
-----------------------------------
--2024-08-11 08:45:03.269341 UTC--
| Itration            | 109      |
| Real Det Return     | 253      |
| Real Sto Return     | -5.97    |
| Reward Loss         | -1.2e+07 |
| Running Env Steps   | 545000   |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 109      |
----------------------------------
--2024-08-11 08:46:34.682849 UTC---
| Itration            | 110       |
| Real Det Return     | 240       |
| Real Sto Return     | -8.43     |
| Reward Loss         | -1.27e+07 |
| Running Env Steps   | 550000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 110       |
-----------------------------------
--2024-08-11 08:48:06.368720 UTC---
| Itration            | 111       |
| Real Det Return     | 268       |
| Real Sto Return     | 19.6      |
| Reward Loss         | -1.28e+07 |
| Running Env Steps   | 555000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 111       |
-----------------------------------
--2024-08-11 08:49:38.020028 UTC--
| Itration            | 112      |
| Real Det Return     | 277      |
| Real Sto Return     | 23.3     |
| Reward Loss         | -1.3e+07 |
| Running Env Steps   | 560000   |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 112      |
----------------------------------
--2024-08-11 08:51:11.070732 UTC---
| Itration            | 113       |
| Real Det Return     | 274       |
| Real Sto Return     | 1.41      |
| Reward Loss         | -1.29e+07 |
| Running Env Steps   | 565000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 113       |
-----------------------------------
--2024-08-11 08:52:45.089802 UTC---
| Itration            | 114       |
| Real Det Return     | 260       |
| Real Sto Return     | -0.53     |
| Reward Loss         | -1.31e+07 |
| Running Env Steps   | 570000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 114       |
-----------------------------------
--2024-08-11 08:54:18.788602 UTC---
| Itration            | 115       |
| Real Det Return     | 250       |
| Real Sto Return     | 27.8      |
| Reward Loss         | -1.36e+07 |
| Running Env Steps   | 575000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 115       |
-----------------------------------
--2024-08-11 08:55:52.329713 UTC---
| Itration            | 116       |
| Real Det Return     | 273       |
| Real Sto Return     | -6.75     |
| Reward Loss         | -1.37e+07 |
| Running Env Steps   | 580000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 116       |
-----------------------------------
--2024-08-11 08:57:26.708352 UTC---
| Itration            | 117       |
| Real Det Return     | 276       |
| Real Sto Return     | 17.6      |
| Reward Loss         | -1.37e+07 |
| Running Env Steps   | 585000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 117       |
-----------------------------------
--2024-08-11 08:58:59.445536 UTC---
| Itration            | 118       |
| Real Det Return     | 269       |
| Real Sto Return     | 20.6      |
| Reward Loss         | -1.34e+07 |
| Running Env Steps   | 590000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 118       |
-----------------------------------
--2024-08-11 09:00:34.581181 UTC--
| Itration            | 119      |
| Real Det Return     | 241      |
| Real Sto Return     | 17.1     |
| Reward Loss         | -1.4e+07 |
| Running Env Steps   | 595000   |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 119      |
----------------------------------
--2024-08-11 09:02:06.572191 UTC---
| Itration            | 120       |
| Real Det Return     | 274       |
| Real Sto Return     | 30.9      |
| Reward Loss         | -1.38e+07 |
| Running Env Steps   | 600000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 120       |
-----------------------------------
--2024-08-11 09:03:41.144387 UTC--
| Itration            | 121      |
| Real Det Return     | 270      |
| Real Sto Return     | 33.8     |
| Reward Loss         | -1.4e+07 |
| Running Env Steps   | 605000   |
| Running Forward KL  | 29.7     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 121      |
----------------------------------
--2024-08-11 09:05:16.774832 UTC--
| Itration            | 122      |
| Real Det Return     | 263      |
| Real Sto Return     | 17.4     |
| Reward Loss         | -1.4e+07 |
| Running Env Steps   | 610000   |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 122      |
----------------------------------
--2024-08-11 09:06:50.782821 UTC---
| Itration            | 123       |
| Real Det Return     | 272       |
| Real Sto Return     | 3.38      |
| Reward Loss         | -1.43e+07 |
| Running Env Steps   | 615000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 123       |
-----------------------------------
--2024-08-11 09:08:24.522539 UTC---
| Itration            | 124       |
| Real Det Return     | 269       |
| Real Sto Return     | 28.6      |
| Reward Loss         | -1.45e+07 |
| Running Env Steps   | 620000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 124       |
-----------------------------------
--2024-08-11 09:09:58.709925 UTC---
| Itration            | 125       |
| Real Det Return     | 310       |
| Real Sto Return     | 47.2      |
| Reward Loss         | -1.45e+07 |
| Running Env Steps   | 625000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 125       |
-----------------------------------
--2024-08-11 09:11:31.596733 UTC---
| Itration            | 126       |
| Real Det Return     | 284       |
| Real Sto Return     | 21.5      |
| Reward Loss         | -1.51e+07 |
| Running Env Steps   | 630000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 126       |
-----------------------------------
--2024-08-11 09:13:07.182943 UTC---
| Itration            | 127       |
| Real Det Return     | 277       |
| Real Sto Return     | 44.5      |
| Reward Loss         | -1.49e+07 |
| Running Env Steps   | 635000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 127       |
-----------------------------------
--2024-08-11 09:14:38.228270 UTC---
| Itration            | 128       |
| Real Det Return     | 268       |
| Real Sto Return     | 18.6      |
| Reward Loss         | -1.57e+07 |
| Running Env Steps   | 640000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 128       |
-----------------------------------
--2024-08-11 09:16:12.294371 UTC---
| Itration            | 129       |
| Real Det Return     | 273       |
| Real Sto Return     | 14.5      |
| Reward Loss         | -1.53e+07 |
| Running Env Steps   | 645000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 129       |
-----------------------------------
--2024-08-11 09:17:47.738431 UTC---
| Itration            | 130       |
| Real Det Return     | 261       |
| Real Sto Return     | 31.3      |
| Reward Loss         | -1.59e+07 |
| Running Env Steps   | 650000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 130       |
-----------------------------------
--2024-08-11 09:19:21.514511 UTC---
| Itration            | 131       |
| Real Det Return     | 265       |
| Real Sto Return     | 38.4      |
| Reward Loss         | -1.61e+07 |
| Running Env Steps   | 655000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 131       |
-----------------------------------
--2024-08-11 09:20:55.406956 UTC---
| Itration            | 132       |
| Real Det Return     | 230       |
| Real Sto Return     | 34.5      |
| Reward Loss         | -1.62e+07 |
| Running Env Steps   | 660000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 132       |
-----------------------------------
--2024-08-11 09:22:29.383482 UTC---
| Itration            | 133       |
| Real Det Return     | 275       |
| Real Sto Return     | 26.1      |
| Reward Loss         | -1.66e+07 |
| Running Env Steps   | 665000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 133       |
-----------------------------------
--2024-08-11 09:24:02.644453 UTC---
| Itration            | 134       |
| Real Det Return     | 260       |
| Real Sto Return     | 25        |
| Reward Loss         | -1.61e+07 |
| Running Env Steps   | 670000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 134       |
-----------------------------------
--2024-08-11 09:25:37.923721 UTC---
| Itration            | 135       |
| Real Det Return     | 228       |
| Real Sto Return     | 29.2      |
| Reward Loss         | -1.63e+07 |
| Running Env Steps   | 675000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 135       |
-----------------------------------
--2024-08-11 09:27:10.690024 UTC---
| Itration            | 136       |
| Real Det Return     | 261       |
| Real Sto Return     | 40.9      |
| Reward Loss         | -1.66e+07 |
| Running Env Steps   | 680000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 136       |
-----------------------------------
--2024-08-11 09:28:45.513647 UTC---
| Itration            | 137       |
| Real Det Return     | 261       |
| Real Sto Return     | 48.3      |
| Reward Loss         | -1.71e+07 |
| Running Env Steps   | 685000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 137       |
-----------------------------------
--2024-08-11 09:30:20.829756 UTC---
| Itration            | 138       |
| Real Det Return     | 298       |
| Real Sto Return     | 61.9      |
| Reward Loss         | -1.68e+07 |
| Running Env Steps   | 690000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 138       |
-----------------------------------
--2024-08-11 09:31:54.273025 UTC---
| Itration            | 139       |
| Real Det Return     | 289       |
| Real Sto Return     | 55.5      |
| Reward Loss         | -1.77e+07 |
| Running Env Steps   | 695000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 139       |
-----------------------------------
--2024-08-11 09:33:27.406113 UTC---
| Itration            | 140       |
| Real Det Return     | 351       |
| Real Sto Return     | 69.9      |
| Reward Loss         | -1.71e+07 |
| Running Env Steps   | 700000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 140       |
-----------------------------------
--2024-08-11 09:35:00.663931 UTC---
| Itration            | 141       |
| Real Det Return     | 363       |
| Real Sto Return     | 96.8      |
| Reward Loss         | -1.79e+07 |
| Running Env Steps   | 705000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 141       |
-----------------------------------
--2024-08-11 09:36:33.202971 UTC--
| Itration            | 142      |
| Real Det Return     | 357      |
| Real Sto Return     | 69.3     |
| Reward Loss         | -1.8e+07 |
| Running Env Steps   | 710000   |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 142      |
----------------------------------
--2024-08-11 09:38:08.576708 UTC---
| Itration            | 143       |
| Real Det Return     | 363       |
| Real Sto Return     | 126       |
| Reward Loss         | -1.87e+07 |
| Running Env Steps   | 715000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 9.89      |
| Running Update Time | 143       |
-----------------------------------
--2024-08-11 09:39:40.836216 UTC---
| Itration            | 144       |
| Real Det Return     | 369       |
| Real Sto Return     | 107       |
| Reward Loss         | -1.82e+07 |
| Running Env Steps   | 720000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 9.97      |
| Running Update Time | 144       |
-----------------------------------
--2024-08-11 09:41:14.848082 UTC---
| Itration            | 145       |
| Real Det Return     | 468       |
| Real Sto Return     | 106       |
| Reward Loss         | -1.88e+07 |
| Running Env Steps   | 725000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 145       |
-----------------------------------
--2024-08-11 09:42:50.951203 UTC---
| Itration            | 146       |
| Real Det Return     | 361       |
| Real Sto Return     | 128       |
| Reward Loss         | -1.83e+07 |
| Running Env Steps   | 730000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 9.94      |
| Running Update Time | 146       |
-----------------------------------
--2024-08-11 09:44:24.164606 UTC---
| Itration            | 147       |
| Real Det Return     | 388       |
| Real Sto Return     | 218       |
| Reward Loss         | -1.93e+07 |
| Running Env Steps   | 735000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 147       |
-----------------------------------
--2024-08-11 09:45:58.088444 UTC--
| Itration            | 148      |
| Real Det Return     | 460      |
| Real Sto Return     | 210      |
| Reward Loss         | -1.9e+07 |
| Running Env Steps   | 740000   |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 148      |
----------------------------------
--2024-08-11 09:47:33.388784 UTC---
| Itration            | 149       |
| Real Det Return     | 434       |
| Real Sto Return     | 177       |
| Reward Loss         | -1.94e+07 |
| Running Env Steps   | 745000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10        |
| Running Update Time | 149       |
-----------------------------------
--2024-08-11 09:49:08.012208 UTC---
| Itration            | 150       |
| Real Det Return     | 390       |
| Real Sto Return     | 117       |
| Reward Loss         | -1.95e+07 |
| Running Env Steps   | 750000    |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 150       |
-----------------------------------
--2024-08-11 09:50:42.640273 UTC---
| Itration            | 151       |
| Real Det Return     | 403       |
| Real Sto Return     | 225       |
| Reward Loss         | -1.94e+07 |
| Running Env Steps   | 755000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 151       |
-----------------------------------
--2024-08-11 09:52:16.159263 UTC---
| Itration            | 152       |
| Real Det Return     | 439       |
| Real Sto Return     | 134       |
| Reward Loss         | -1.99e+07 |
| Running Env Steps   | 760000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 152       |
-----------------------------------
--2024-08-11 09:53:51.123530 UTC---
| Itration            | 153       |
| Real Det Return     | 436       |
| Real Sto Return     | 195       |
| Reward Loss         | -2.01e+07 |
| Running Env Steps   | 765000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 153       |
-----------------------------------
--2024-08-11 09:55:26.546774 UTC--
| Itration            | 154      |
| Real Det Return     | 438      |
| Real Sto Return     | 152      |
| Reward Loss         | -2e+07   |
| Running Env Steps   | 770000   |
| Running Forward KL  | 29.6     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 154      |
----------------------------------
--2024-08-11 09:57:00.554780 UTC---
| Itration            | 155       |
| Real Det Return     | 609       |
| Real Sto Return     | 106       |
| Reward Loss         | -1.96e+07 |
| Running Env Steps   | 775000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 155       |
-----------------------------------
--2024-08-11 09:58:34.808198 UTC---
| Itration            | 156       |
| Real Det Return     | 372       |
| Real Sto Return     | 148       |
| Reward Loss         | -1.98e+07 |
| Running Env Steps   | 780000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 156       |
-----------------------------------
--2024-08-11 10:00:08.666478 UTC---
| Itration            | 157       |
| Real Det Return     | 534       |
| Real Sto Return     | 120       |
| Reward Loss         | -2.08e+07 |
| Running Env Steps   | 785000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 157       |
-----------------------------------
--2024-08-11 10:01:41.748525 UTC---
| Itration            | 158       |
| Real Det Return     | 449       |
| Real Sto Return     | 160       |
| Reward Loss         | -2.08e+07 |
| Running Env Steps   | 790000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 158       |
-----------------------------------
--2024-08-11 10:03:15.546588 UTC---
| Itration            | 159       |
| Real Det Return     | 488       |
| Real Sto Return     | 106       |
| Reward Loss         | -2.03e+07 |
| Running Env Steps   | 795000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 159       |
-----------------------------------
--2024-08-11 10:04:47.635267 UTC--
| Itration            | 160      |
| Real Det Return     | 539      |
| Real Sto Return     | 155      |
| Reward Loss         | -2.1e+07 |
| Running Env Steps   | 800000   |
| Running Forward KL  | 29.6     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 160      |
----------------------------------
--2024-08-11 10:06:23.431464 UTC---
| Itration            | 161       |
| Real Det Return     | 891       |
| Real Sto Return     | 144       |
| Reward Loss         | -2.14e+07 |
| Running Env Steps   | 805000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 161       |
-----------------------------------
--2024-08-11 10:07:58.901472 UTC---
| Itration            | 162       |
| Real Det Return     | 733       |
| Real Sto Return     | 123       |
| Reward Loss         | -2.08e+07 |
| Running Env Steps   | 810000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 162       |
-----------------------------------
--2024-08-11 10:09:32.785804 UTC---
| Itration            | 163       |
| Real Det Return     | 695       |
| Real Sto Return     | 95.8      |
| Reward Loss         | -2.13e+07 |
| Running Env Steps   | 815000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 163       |
-----------------------------------
--2024-08-11 10:11:06.409901 UTC---
| Itration            | 164       |
| Real Det Return     | 530       |
| Real Sto Return     | 128       |
| Reward Loss         | -2.13e+07 |
| Running Env Steps   | 820000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 164       |
-----------------------------------
--2024-08-11 10:12:41.771753 UTC---
| Itration            | 165       |
| Real Det Return     | 579       |
| Real Sto Return     | 134       |
| Reward Loss         | -2.15e+07 |
| Running Env Steps   | 825000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 165       |
-----------------------------------
--2024-08-11 10:14:14.212110 UTC---
| Itration            | 166       |
| Real Det Return     | 767       |
| Real Sto Return     | 188       |
| Reward Loss         | -2.17e+07 |
| Running Env Steps   | 830000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 166       |
-----------------------------------
--2024-08-11 10:15:48.475051 UTC---
| Itration            | 167       |
| Real Det Return     | 666       |
| Real Sto Return     | 176       |
| Reward Loss         | -2.26e+07 |
| Running Env Steps   | 835000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 167       |
-----------------------------------
--2024-08-11 10:17:22.121582 UTC---
| Itration            | 168       |
| Real Det Return     | 855       |
| Real Sto Return     | 180       |
| Reward Loss         | -2.28e+07 |
| Running Env Steps   | 840000    |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 168       |
-----------------------------------
--2024-08-11 10:18:57.095591 UTC--
| Itration            | 169      |
| Real Det Return     | 928      |
| Real Sto Return     | 128      |
| Reward Loss         | -2.3e+07 |
| Running Env Steps   | 845000   |
| Running Forward KL  | 29.7     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 169      |
----------------------------------
--2024-08-11 10:20:32.536413 UTC---
| Itration            | 170       |
| Real Det Return     | 634       |
| Real Sto Return     | 132       |
| Reward Loss         | -2.23e+07 |
| Running Env Steps   | 850000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 170       |
-----------------------------------
--2024-08-11 10:22:05.895982 UTC---
| Itration            | 171       |
| Real Det Return     | 832       |
| Real Sto Return     | 247       |
| Reward Loss         | -2.28e+07 |
| Running Env Steps   | 855000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 171       |
-----------------------------------
--2024-08-11 10:23:39.684388 UTC---
| Itration            | 172       |
| Real Det Return     | 667       |
| Real Sto Return     | 208       |
| Reward Loss         | -2.29e+07 |
| Running Env Steps   | 860000    |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 172       |
-----------------------------------
--2024-08-11 10:25:14.946595 UTC---
| Itration            | 173       |
| Real Det Return     | 781       |
| Real Sto Return     | 206       |
| Reward Loss         | -2.38e+07 |
| Running Env Steps   | 865000    |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 173       |
-----------------------------------
--2024-08-11 10:26:47.251002 UTC--
| Itration            | 174      |
| Real Det Return     | 516      |
| Real Sto Return     | 274      |
| Reward Loss         | -2.4e+07 |
| Running Env Steps   | 870000   |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 174      |
----------------------------------
--2024-08-11 10:28:22.479581 UTC---
| Itration            | 175       |
| Real Det Return     | 886       |
| Real Sto Return     | 268       |
| Reward Loss         | -2.34e+07 |
| Running Env Steps   | 875000    |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 175       |
-----------------------------------
--2024-08-11 10:29:56.216475 UTC---
| Itration            | 176       |
| Real Det Return     | 902       |
| Real Sto Return     | 397       |
| Reward Loss         | -2.39e+07 |
| Running Env Steps   | 880000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 176       |
-----------------------------------
--2024-08-11 10:31:30.347577 UTC---
| Itration            | 177       |
| Real Det Return     | 865       |
| Real Sto Return     | 339       |
| Reward Loss         | -2.47e+07 |
| Running Env Steps   | 885000    |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 177       |
-----------------------------------
--2024-08-11 10:33:06.587525 UTC--
| Itration            | 178      |
| Real Det Return     | 976      |
| Real Sto Return     | 252      |
| Reward Loss         | -2.4e+07 |
| Running Env Steps   | 890000   |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 178      |
----------------------------------
--2024-08-11 10:34:39.633888 UTC---
| Itration            | 179       |
| Real Det Return     | 1.01e+03  |
| Real Sto Return     | 505       |
| Reward Loss         | -2.49e+07 |
| Running Env Steps   | 895000    |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 179       |
-----------------------------------
--2024-08-11 10:36:13.584129 UTC---
| Itration            | 180       |
| Real Det Return     | 853       |
| Real Sto Return     | 509       |
| Reward Loss         | -2.49e+07 |
| Running Env Steps   | 900000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 11        |
| Running Update Time | 180       |
-----------------------------------
--2024-08-11 10:37:48.448882 UTC---
| Itration            | 181       |
| Real Det Return     | 1.17e+03  |
| Real Sto Return     | 257       |
| Reward Loss         | -2.52e+07 |
| Running Env Steps   | 905000    |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 181       |
-----------------------------------
--2024-08-11 10:39:20.463977 UTC---
| Itration            | 182       |
| Real Det Return     | 1.07e+03  |
| Real Sto Return     | 533       |
| Reward Loss         | -2.52e+07 |
| Running Env Steps   | 910000    |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 182       |
-----------------------------------
--2024-08-11 10:40:54.458508 UTC---
| Itration            | 183       |
| Real Det Return     | 1.05e+03  |
| Real Sto Return     | 664       |
| Reward Loss         | -2.62e+07 |
| Running Env Steps   | 915000    |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 11.9      |
| Running Update Time | 183       |
-----------------------------------
--2024-08-11 10:42:27.510228 UTC---
| Itration            | 184       |
| Real Det Return     | 1.31e+03  |
| Real Sto Return     | 557       |
| Reward Loss         | -2.53e+07 |
| Running Env Steps   | 920000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 184       |
-----------------------------------
--2024-08-11 10:44:01.070525 UTC---
| Itration            | 185       |
| Real Det Return     | 1.07e+03  |
| Real Sto Return     | 457       |
| Reward Loss         | -2.57e+07 |
| Running Env Steps   | 925000    |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 185       |
-----------------------------------
--2024-08-11 10:45:36.659561 UTC---
| Itration            | 186       |
| Real Det Return     | 1.43e+03  |
| Real Sto Return     | 352       |
| Reward Loss         | -2.55e+07 |
| Running Env Steps   | 930000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 186       |
-----------------------------------
--2024-08-11 10:47:08.978467 UTC---
| Itration            | 187       |
| Real Det Return     | 1.27e+03  |
| Real Sto Return     | 420       |
| Reward Loss         | -2.66e+07 |
| Running Env Steps   | 935000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 187       |
-----------------------------------
--2024-08-11 10:48:43.808241 UTC---
| Itration            | 188       |
| Real Det Return     | 1.39e+03  |
| Real Sto Return     | 300       |
| Reward Loss         | -2.58e+07 |
| Running Env Steps   | 940000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 188       |
-----------------------------------
--2024-08-11 10:50:18.841718 UTC---
| Itration            | 189       |
| Real Det Return     | 1.42e+03  |
| Real Sto Return     | 305       |
| Reward Loss         | -2.67e+07 |
| Running Env Steps   | 945000    |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 189       |
-----------------------------------
--2024-08-11 10:51:50.680947 UTC---
| Itration            | 190       |
| Real Det Return     | 782       |
| Real Sto Return     | 259       |
| Reward Loss         | -2.69e+07 |
| Running Env Steps   | 950000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 190       |
-----------------------------------
--2024-08-11 10:53:24.773666 UTC---
| Itration            | 191       |
| Real Det Return     | 630       |
| Real Sto Return     | 237       |
| Reward Loss         | -2.72e+07 |
| Running Env Steps   | 955000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 11        |
| Running Update Time | 191       |
-----------------------------------
--2024-08-11 10:54:59.117098 UTC---
| Itration            | 192       |
| Real Det Return     | 537       |
| Real Sto Return     | 213       |
| Reward Loss         | -2.66e+07 |
| Running Env Steps   | 960000    |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 192       |
-----------------------------------
--2024-08-11 10:56:32.321257 UTC--
| Itration            | 193      |
| Real Det Return     | 559      |
| Real Sto Return     | 239      |
| Reward Loss         | -2.8e+07 |
| Running Env Steps   | 965000   |
| Running Forward KL  | 29.3     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 193      |
----------------------------------
--2024-08-11 10:58:06.890344 UTC---
| Itration            | 194       |
| Real Det Return     | 568       |
| Real Sto Return     | 269       |
| Reward Loss         | -2.81e+07 |
| Running Env Steps   | 970000    |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 194       |
-----------------------------------
--2024-08-11 10:59:39.961649 UTC---
| Itration            | 195       |
| Real Det Return     | 715       |
| Real Sto Return     | 230       |
| Reward Loss         | -2.75e+07 |
| Running Env Steps   | 975000    |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 195       |
-----------------------------------
--2024-08-11 11:01:14.046363 UTC---
| Itration            | 196       |
| Real Det Return     | 769       |
| Real Sto Return     | 276       |
| Reward Loss         | -2.88e+07 |
| Running Env Steps   | 980000    |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 196       |
-----------------------------------
--2024-08-11 11:02:49.736360 UTC---
| Itration            | 197       |
| Real Det Return     | 1.06e+03  |
| Real Sto Return     | 329       |
| Reward Loss         | -2.77e+07 |
| Running Env Steps   | 985000    |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 197       |
-----------------------------------
--2024-08-11 11:04:23.269426 UTC---
| Itration            | 198       |
| Real Det Return     | 528       |
| Real Sto Return     | 237       |
| Reward Loss         | -2.79e+07 |
| Running Env Steps   | 990000    |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 198       |
-----------------------------------
--2024-08-11 11:05:56.523342 UTC---
| Itration            | 199       |
| Real Det Return     | 576       |
| Real Sto Return     | 275       |
| Reward Loss         | -2.83e+07 |
| Running Env Steps   | 995000    |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 199       |
-----------------------------------
--2024-08-11 11:07:30.695756 UTC---
| Itration            | 200       |
| Real Det Return     | 526       |
| Real Sto Return     | 247       |
| Reward Loss         | -2.84e+07 |
| Running Env Steps   | 1000000   |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 200       |
-----------------------------------
--2024-08-11 11:09:03.155144 UTC---
| Itration            | 201       |
| Real Det Return     | 757       |
| Real Sto Return     | 407       |
| Reward Loss         | -2.97e+07 |
| Running Env Steps   | 1005000   |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 11        |
| Running Update Time | 201       |
-----------------------------------
--2024-08-11 11:10:38.151955 UTC---
| Itration            | 202       |
| Real Det Return     | 1.26e+03  |
| Real Sto Return     | 433       |
| Reward Loss         | -2.94e+07 |
| Running Env Steps   | 1010000   |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 202       |
-----------------------------------
--2024-08-11 11:12:10.158068 UTC---
| Itration            | 203       |
| Real Det Return     | 1.49e+03  |
| Real Sto Return     | 442       |
| Reward Loss         | -2.98e+07 |
| Running Env Steps   | 1015000   |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 203       |
-----------------------------------
--2024-08-11 11:13:44.584924 UTC---
| Itration            | 204       |
| Real Det Return     | 1.52e+03  |
| Real Sto Return     | 437       |
| Reward Loss         | -2.91e+07 |
| Running Env Steps   | 1020000   |
| Running Forward KL  | 29        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 204       |
-----------------------------------
--2024-08-11 11:15:20.627787 UTC---
| Itration            | 205       |
| Real Det Return     | 1.58e+03  |
| Real Sto Return     | 484       |
| Reward Loss         | -3.06e+07 |
| Running Env Steps   | 1025000   |
| Running Forward KL  | 29.1      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 205       |
-----------------------------------
--2024-08-11 11:16:54.088541 UTC---
| Itration            | 206       |
| Real Det Return     | 1.62e+03  |
| Real Sto Return     | 682       |
| Reward Loss         | -2.97e+07 |
| Running Env Steps   | 1030000   |
| Running Forward KL  | 28.9      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 206       |
-----------------------------------
--2024-08-11 11:18:27.664501 UTC---
| Itration            | 207       |
| Real Det Return     | 1.35e+03  |
| Real Sto Return     | 855       |
| Reward Loss         | -3.05e+07 |
| Running Env Steps   | 1035000   |
| Running Forward KL  | 29        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 207       |
-----------------------------------
--2024-08-11 11:20:02.186132 UTC---
| Itration            | 208       |
| Real Det Return     | 1.59e+03  |
| Real Sto Return     | 1.01e+03  |
| Reward Loss         | -3.01e+07 |
| Running Env Steps   | 1040000   |
| Running Forward KL  | 29        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 208       |
-----------------------------------
--2024-08-11 11:21:34.636058 UTC---
| Itration            | 209       |
| Real Det Return     | 1.67e+03  |
| Real Sto Return     | 1.17e+03  |
| Reward Loss         | -3.01e+07 |
| Running Env Steps   | 1045000   |
| Running Forward KL  | 29        |
| Running Reverse KL  | 10.7      |
| Running Update Time | 209       |
-----------------------------------
--2024-08-11 11:23:09.056920 UTC--
| Itration            | 210      |
| Real Det Return     | 1.88e+03 |
| Real Sto Return     | 1.33e+03 |
| Reward Loss         | -3e+07   |
| Running Env Steps   | 1050000  |
| Running Forward KL  | 28.7     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 210      |
----------------------------------
--2024-08-11 11:24:41.343330 UTC--
| Itration            | 211      |
| Real Det Return     | 1.77e+03 |
| Real Sto Return     | 1.21e+03 |
| Reward Loss         | -3.1e+07 |
| Running Env Steps   | 1055000  |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 211      |
----------------------------------
--2024-08-11 11:26:16.987231 UTC---
| Itration            | 212       |
| Real Det Return     | 1.83e+03  |
| Real Sto Return     | 1.36e+03  |
| Reward Loss         | -3.14e+07 |
| Running Env Steps   | 1060000   |
| Running Forward KL  | 28.7      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 212       |
-----------------------------------
--2024-08-11 11:27:52.071878 UTC---
| Itration            | 213       |
| Real Det Return     | 1.97e+03  |
| Real Sto Return     | 1.5e+03   |
| Reward Loss         | -3.17e+07 |
| Running Env Steps   | 1065000   |
| Running Forward KL  | 28.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 213       |
-----------------------------------
--2024-08-11 11:29:26.288538 UTC---
| Itration            | 214       |
| Real Det Return     | 1.92e+03  |
| Real Sto Return     | 1.15e+03  |
| Reward Loss         | -3.11e+07 |
| Running Env Steps   | 1070000   |
| Running Forward KL  | 28.7      |
| Running Reverse KL  | 10        |
| Running Update Time | 214       |
-----------------------------------
--2024-08-11 11:31:00.293695 UTC---
| Itration            | 215       |
| Real Det Return     | 2.09e+03  |
| Real Sto Return     | 1.5e+03   |
| Reward Loss         | -3.09e+07 |
| Running Env Steps   | 1075000   |
| Running Forward KL  | 28.6      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 215       |
-----------------------------------
--2024-08-11 11:32:35.878403 UTC--
| Itration            | 216      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 1.48e+03 |
| Reward Loss         | -3.1e+07 |
| Running Env Steps   | 1080000  |
| Running Forward KL  | 28.6     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 216      |
----------------------------------
--2024-08-11 11:34:08.851943 UTC---
| Itration            | 217       |
| Real Det Return     | 2.3e+03   |
| Real Sto Return     | 1.61e+03  |
| Reward Loss         | -3.12e+07 |
| Running Env Steps   | 1085000   |
| Running Forward KL  | 29        |
| Running Reverse KL  | 11        |
| Running Update Time | 217       |
-----------------------------------
--2024-08-11 11:35:42.532356 UTC--
| Itration            | 218      |
| Real Det Return     | 2.37e+03 |
| Real Sto Return     | 1.61e+03 |
| Reward Loss         | -3.2e+07 |
| Running Env Steps   | 1090000  |
| Running Forward KL  | 28.8     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 218      |
----------------------------------
--2024-08-11 11:37:16.248363 UTC---
| Itration            | 219       |
| Real Det Return     | 2.38e+03  |
| Real Sto Return     | 1.51e+03  |
| Reward Loss         | -3.08e+07 |
| Running Env Steps   | 1095000   |
| Running Forward KL  | 27.9      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 219       |
-----------------------------------
--2024-08-11 11:38:50.368614 UTC---
| Itration            | 220       |
| Real Det Return     | 2.6e+03   |
| Real Sto Return     | 1.84e+03  |
| Reward Loss         | -3.11e+07 |
| Running Env Steps   | 1100000   |
| Running Forward KL  | 28.2      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 220       |
-----------------------------------
--2024-08-11 11:40:25.571925 UTC---
| Itration            | 221       |
| Real Det Return     | 2.67e+03  |
| Real Sto Return     | 1.7e+03   |
| Reward Loss         | -3.11e+07 |
| Running Env Steps   | 1105000   |
| Running Forward KL  | 27.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 221       |
-----------------------------------
--2024-08-11 11:41:58.948111 UTC---
| Itration            | 222       |
| Real Det Return     | 3.16e+03  |
| Real Sto Return     | 2.17e+03  |
| Reward Loss         | -2.99e+07 |
| Running Env Steps   | 1110000   |
| Running Forward KL  | 27.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 222       |
-----------------------------------
--2024-08-11 11:43:33.373203 UTC--
| Itration            | 223      |
| Real Det Return     | 3.32e+03 |
| Real Sto Return     | 2.22e+03 |
| Reward Loss         | -3e+07   |
| Running Env Steps   | 1115000  |
| Running Forward KL  | 27       |
| Running Reverse KL  | 11.1     |
| Running Update Time | 223      |
----------------------------------
--2024-08-11 11:45:08.711804 UTC---
| Itration            | 224       |
| Real Det Return     | 2.88e+03  |
| Real Sto Return     | 2.19e+03  |
| Reward Loss         | -3.12e+07 |
| Running Env Steps   | 1120000   |
| Running Forward KL  | 26.5      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 224       |
-----------------------------------
--2024-08-11 11:46:42.538369 UTC---
| Itration            | 225       |
| Real Det Return     | 3.39e+03  |
| Real Sto Return     | 2.06e+03  |
| Reward Loss         | -3.13e+07 |
| Running Env Steps   | 1125000   |
| Running Forward KL  | 26.7      |
| Running Reverse KL  | 12.5      |
| Running Update Time | 225       |
-----------------------------------
--2024-08-11 11:48:16.010426 UTC---
| Itration            | 226       |
| Real Det Return     | 3.74e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -2.97e+07 |
| Running Env Steps   | 1130000   |
| Running Forward KL  | 26.1      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 226       |
-----------------------------------
--2024-08-11 11:49:49.454100 UTC---
| Itration            | 227       |
| Real Det Return     | 3.81e+03  |
| Real Sto Return     | 2.96e+03  |
| Reward Loss         | -2.91e+07 |
| Running Env Steps   | 1135000   |
| Running Forward KL  | 26.5      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 227       |
-----------------------------------
--2024-08-11 11:51:21.315379 UTC---
| Itration            | 228       |
| Real Det Return     | 3.45e+03  |
| Real Sto Return     | 2.52e+03  |
| Reward Loss         | -2.99e+07 |
| Running Env Steps   | 1140000   |
| Running Forward KL  | 26.1      |
| Running Reverse KL  | 12        |
| Running Update Time | 228       |
-----------------------------------
--2024-08-11 11:52:56.363771 UTC---
| Itration            | 229       |
| Real Det Return     | 3.75e+03  |
| Real Sto Return     | 2.61e+03  |
| Reward Loss         | -2.99e+07 |
| Running Env Steps   | 1145000   |
| Running Forward KL  | 26.1      |
| Running Reverse KL  | 9.88      |
| Running Update Time | 229       |
-----------------------------------
--2024-08-11 11:54:27.712304 UTC---
| Itration            | 230       |
| Real Det Return     | 4.28e+03  |
| Real Sto Return     | 2.99e+03  |
| Reward Loss         | -2.94e+07 |
| Running Env Steps   | 1150000   |
| Running Forward KL  | 26.3      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 230       |
-----------------------------------
--2024-08-11 11:56:01.556447 UTC---
| Itration            | 231       |
| Real Det Return     | 2.92e+03  |
| Real Sto Return     | 2.62e+03  |
| Reward Loss         | -2.93e+07 |
| Running Env Steps   | 1155000   |
| Running Forward KL  | 25.2      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 231       |
-----------------------------------
--2024-08-11 11:57:35.564752 UTC---
| Itration            | 232       |
| Real Det Return     | 3e+03     |
| Real Sto Return     | 2.33e+03  |
| Reward Loss         | -3.13e+07 |
| Running Env Steps   | 1160000   |
| Running Forward KL  | 26.6      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 232       |
-----------------------------------
--2024-08-11 11:59:08.433654 UTC---
| Itration            | 233       |
| Real Det Return     | 4.17e+03  |
| Real Sto Return     | 3.37e+03  |
| Reward Loss         | -2.92e+07 |
| Running Env Steps   | 1165000   |
| Running Forward KL  | 26.7      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 233       |
-----------------------------------
--2024-08-11 12:00:42.116635 UTC---
| Itration            | 234       |
| Real Det Return     | 4.49e+03  |
| Real Sto Return     | 3.63e+03  |
| Reward Loss         | -2.74e+07 |
| Running Env Steps   | 1170000   |
| Running Forward KL  | 25.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 234       |
-----------------------------------
--2024-08-11 12:02:14.985488 UTC---
| Itration            | 235       |
| Real Det Return     | 4.36e+03  |
| Real Sto Return     | 3.53e+03  |
| Reward Loss         | -2.76e+07 |
| Running Env Steps   | 1175000   |
| Running Forward KL  | 25.9      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 235       |
-----------------------------------
--2024-08-11 12:03:47.651642 UTC---
| Itration            | 236       |
| Real Det Return     | 4.69e+03  |
| Real Sto Return     | 3.83e+03  |
| Reward Loss         | -2.74e+07 |
| Running Env Steps   | 1180000   |
| Running Forward KL  | 25.5      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 236       |
-----------------------------------
--2024-08-11 12:05:20.946690 UTC---
| Itration            | 237       |
| Real Det Return     | 4.62e+03  |
| Real Sto Return     | 3.93e+03  |
| Reward Loss         | -2.71e+07 |
| Running Env Steps   | 1185000   |
| Running Forward KL  | 25.7      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 237       |
-----------------------------------
--2024-08-11 12:06:52.455078 UTC---
| Itration            | 238       |
| Real Det Return     | 5e+03     |
| Real Sto Return     | 3.95e+03  |
| Reward Loss         | -2.67e+07 |
| Running Env Steps   | 1190000   |
| Running Forward KL  | 24.3      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 238       |
-----------------------------------
--2024-08-11 12:08:24.910344 UTC---
| Itration            | 239       |
| Real Det Return     | 5.09e+03  |
| Real Sto Return     | 4.26e+03  |
| Reward Loss         | -2.68e+07 |
| Running Env Steps   | 1195000   |
| Running Forward KL  | 24.2      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 239       |
-----------------------------------
--2024-08-11 12:09:56.908921 UTC---
| Itration            | 240       |
| Real Det Return     | 4.96e+03  |
| Real Sto Return     | 4.37e+03  |
| Reward Loss         | -2.56e+07 |
| Running Env Steps   | 1200000   |
| Running Forward KL  | 24.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 240       |
-----------------------------------
--2024-08-11 12:11:27.933147 UTC---
| Itration            | 241       |
| Real Det Return     | 5.22e+03  |
| Real Sto Return     | 4.53e+03  |
| Reward Loss         | -2.79e+07 |
| Running Env Steps   | 1205000   |
| Running Forward KL  | 24.2      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 241       |
-----------------------------------
--2024-08-11 12:13:00.872185 UTC---
| Itration            | 242       |
| Real Det Return     | 5.67e+03  |
| Real Sto Return     | 4.33e+03  |
| Reward Loss         | -2.52e+07 |
| Running Env Steps   | 1210000   |
| Running Forward KL  | 23.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 242       |
-----------------------------------
--2024-08-11 12:14:31.608818 UTC---
| Itration            | 243       |
| Real Det Return     | 5.63e+03  |
| Real Sto Return     | 4.68e+03  |
| Reward Loss         | -2.45e+07 |
| Running Env Steps   | 1215000   |
| Running Forward KL  | 22.5      |
| Running Reverse KL  | 9.88      |
| Running Update Time | 243       |
-----------------------------------
--2024-08-11 12:16:04.478271 UTC---
| Itration            | 244       |
| Real Det Return     | 5.68e+03  |
| Real Sto Return     | 4.65e+03  |
| Reward Loss         | -2.55e+07 |
| Running Env Steps   | 1220000   |
| Running Forward KL  | 23.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 244       |
-----------------------------------
--2024-08-11 12:17:35.658016 UTC---
| Itration            | 245       |
| Real Det Return     | 5.71e+03  |
| Real Sto Return     | 4.7e+03   |
| Reward Loss         | -2.49e+07 |
| Running Env Steps   | 1225000   |
| Running Forward KL  | 22.5      |
| Running Reverse KL  | 9.52      |
| Running Update Time | 245       |
-----------------------------------
--2024-08-11 12:19:05.832156 UTC---
| Itration            | 246       |
| Real Det Return     | 5.86e+03  |
| Real Sto Return     | 5.2e+03   |
| Reward Loss         | -2.49e+07 |
| Running Env Steps   | 1230000   |
| Running Forward KL  | 22.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 246       |
-----------------------------------
--2024-08-11 12:20:38.589800 UTC---
| Itration            | 247       |
| Real Det Return     | 5.83e+03  |
| Real Sto Return     | 5.13e+03  |
| Reward Loss         | -2.39e+07 |
| Running Env Steps   | 1235000   |
| Running Forward KL  | 23.3      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 247       |
-----------------------------------
--2024-08-11 12:22:08.870391 UTC---
| Itration            | 248       |
| Real Det Return     | 5.83e+03  |
| Real Sto Return     | 5.06e+03  |
| Reward Loss         | -2.43e+07 |
| Running Env Steps   | 1240000   |
| Running Forward KL  | 22.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 248       |
-----------------------------------
--2024-08-11 12:23:40.747691 UTC---
| Itration            | 249       |
| Real Det Return     | 6.13e+03  |
| Real Sto Return     | 5.57e+03  |
| Reward Loss         | -2.29e+07 |
| Running Env Steps   | 1245000   |
| Running Forward KL  | 22.4      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 249       |
-----------------------------------
--2024-08-11 12:25:15.004568 UTC--
| Itration            | 250      |
| Real Det Return     | 5.75e+03 |
| Real Sto Return     | 4.99e+03 |
| Reward Loss         | -2.5e+07 |
| Running Env Steps   | 1250000  |
| Running Forward KL  | 22.8     |
| Running Reverse KL  | 9.82     |
| Running Update Time | 250      |
----------------------------------
--2024-08-11 12:26:46.489881 UTC---
| Itration            | 251       |
| Real Det Return     | 6.05e+03  |
| Real Sto Return     | 5.31e+03  |
| Reward Loss         | -2.52e+07 |
| Running Env Steps   | 1255000   |
| Running Forward KL  | 22.4      |
| Running Reverse KL  | 9.86      |
| Running Update Time | 251       |
-----------------------------------
--2024-08-11 12:28:18.707230 UTC---
| Itration            | 252       |
| Real Det Return     | 6.17e+03  |
| Real Sto Return     | 5.58e+03  |
| Reward Loss         | -2.32e+07 |
| Running Env Steps   | 1260000   |
| Running Forward KL  | 22        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 252       |
-----------------------------------
--2024-08-11 12:29:50.270100 UTC---
| Itration            | 253       |
| Real Det Return     | 6.01e+03  |
| Real Sto Return     | 5.46e+03  |
| Reward Loss         | -2.44e+07 |
| Running Env Steps   | 1265000   |
| Running Forward KL  | 22.7      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 253       |
-----------------------------------
--2024-08-11 12:31:23.890717 UTC---
| Itration            | 254       |
| Real Det Return     | 6.76e+03  |
| Real Sto Return     | 5.65e+03  |
| Reward Loss         | -2.27e+07 |
| Running Env Steps   | 1270000   |
| Running Forward KL  | 21.7      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 254       |
-----------------------------------
--2024-08-11 12:32:56.522182 UTC---
| Itration            | 255       |
| Real Det Return     | 6.74e+03  |
| Real Sto Return     | 5.85e+03  |
| Reward Loss         | -2.21e+07 |
| Running Env Steps   | 1275000   |
| Running Forward KL  | 21.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 255       |
-----------------------------------
--2024-08-11 12:34:26.855201 UTC---
| Itration            | 256       |
| Real Det Return     | 6.67e+03  |
| Real Sto Return     | 5.9e+03   |
| Reward Loss         | -2.28e+07 |
| Running Env Steps   | 1280000   |
| Running Forward KL  | 20.7      |
| Running Reverse KL  | 9.85      |
| Running Update Time | 256       |
-----------------------------------
--2024-08-11 12:35:57.064884 UTC---
| Itration            | 257       |
| Real Det Return     | 6.4e+03   |
| Real Sto Return     | 5.66e+03  |
| Reward Loss         | -2.31e+07 |
| Running Env Steps   | 1285000   |
| Running Forward KL  | 21.5      |
| Running Reverse KL  | 9.76      |
| Running Update Time | 257       |
-----------------------------------
--2024-08-11 12:37:28.366609 UTC---
| Itration            | 258       |
| Real Det Return     | 6.52e+03  |
| Real Sto Return     | 5.97e+03  |
| Reward Loss         | -2.35e+07 |
| Running Env Steps   | 1290000   |
| Running Forward KL  | 21.4      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 258       |
-----------------------------------
--2024-08-11 12:39:01.280912 UTC---
| Itration            | 259       |
| Real Det Return     | 6.24e+03  |
| Real Sto Return     | 5.94e+03  |
| Reward Loss         | -2.21e+07 |
| Running Env Steps   | 1295000   |
| Running Forward KL  | 21.7      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 259       |
-----------------------------------
--2024-08-11 12:40:34.991440 UTC---
| Itration            | 260       |
| Real Det Return     | 6.9e+03   |
| Real Sto Return     | 5.91e+03  |
| Reward Loss         | -2.23e+07 |
| Running Env Steps   | 1300000   |
| Running Forward KL  | 20.5      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 260       |
-----------------------------------
--2024-08-11 12:42:07.510268 UTC--
| Itration            | 261      |
| Real Det Return     | 7.38e+03 |
| Real Sto Return     | 6.39e+03 |
| Reward Loss         | -2.3e+07 |
| Running Env Steps   | 1305000  |
| Running Forward KL  | 20.5     |
| Running Reverse KL  | 9.64     |
| Running Update Time | 261      |
----------------------------------
--2024-08-11 12:43:39.446483 UTC---
| Itration            | 262       |
| Real Det Return     | 6.73e+03  |
| Real Sto Return     | 6.17e+03  |
| Reward Loss         | -2.11e+07 |
| Running Env Steps   | 1310000   |
| Running Forward KL  | 20.7      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 262       |
-----------------------------------
--2024-08-11 12:45:11.738335 UTC---
| Itration            | 263       |
| Real Det Return     | 7.38e+03  |
| Real Sto Return     | 6.58e+03  |
| Reward Loss         | -2.14e+07 |
| Running Env Steps   | 1315000   |
| Running Forward KL  | 20.6      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 263       |
-----------------------------------
--2024-08-11 12:46:45.258977 UTC---
| Itration            | 264       |
| Real Det Return     | 7.16e+03  |
| Real Sto Return     | 6.37e+03  |
| Reward Loss         | -2.17e+07 |
| Running Env Steps   | 1320000   |
| Running Forward KL  | 21.2      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 264       |
-----------------------------------
--2024-08-11 12:48:17.365973 UTC---
| Itration            | 265       |
| Real Det Return     | 7.04e+03  |
| Real Sto Return     | 5.66e+03  |
| Reward Loss         | -2.26e+07 |
| Running Env Steps   | 1325000   |
| Running Forward KL  | 21.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 265       |
-----------------------------------
--2024-08-11 12:49:48.613311 UTC---
| Itration            | 266       |
| Real Det Return     | 6.86e+03  |
| Real Sto Return     | 6.16e+03  |
| Reward Loss         | -2.26e+07 |
| Running Env Steps   | 1330000   |
| Running Forward KL  | 21        |
| Running Reverse KL  | 9.96      |
| Running Update Time | 266       |
-----------------------------------
--2024-08-11 12:51:20.209953 UTC---
| Itration            | 267       |
| Real Det Return     | 6.4e+03   |
| Real Sto Return     | 6.08e+03  |
| Reward Loss         | -2.19e+07 |
| Running Env Steps   | 1335000   |
| Running Forward KL  | 21.7      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 267       |
-----------------------------------
--2024-08-11 12:52:51.909986 UTC--
| Itration            | 268      |
| Real Det Return     | 7.57e+03 |
| Real Sto Return     | 6.4e+03  |
| Reward Loss         | -2.2e+07 |
| Running Env Steps   | 1340000  |
| Running Forward KL  | 20.4     |
| Running Reverse KL  | 9.91     |
| Running Update Time | 268      |
----------------------------------
--2024-08-11 12:54:21.368733 UTC---
| Itration            | 269       |
| Real Det Return     | 6.89e+03  |
| Real Sto Return     | 6.43e+03  |
| Reward Loss         | -2.16e+07 |
| Running Env Steps   | 1345000   |
| Running Forward KL  | 20.9      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 269       |
-----------------------------------
--2024-08-11 12:55:54.941381 UTC---
| Itration            | 270       |
| Real Det Return     | 7.64e+03  |
| Real Sto Return     | 6.78e+03  |
| Reward Loss         | -2.05e+07 |
| Running Env Steps   | 1350000   |
| Running Forward KL  | 20        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 270       |
-----------------------------------
--2024-08-11 12:57:24.888659 UTC---
| Itration            | 271       |
| Real Det Return     | 7.9e+03   |
| Real Sto Return     | 6.98e+03  |
| Reward Loss         | -2.05e+07 |
| Running Env Steps   | 1355000   |
| Running Forward KL  | 20.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 271       |
-----------------------------------
--2024-08-11 12:58:57.747882 UTC---
| Itration            | 272       |
| Real Det Return     | 7.93e+03  |
| Real Sto Return     | 6.71e+03  |
| Reward Loss         | -2.15e+07 |
| Running Env Steps   | 1360000   |
| Running Forward KL  | 20.4      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 272       |
-----------------------------------
--2024-08-11 13:00:31.307638 UTC---
| Itration            | 273       |
| Real Det Return     | 7.74e+03  |
| Real Sto Return     | 6.87e+03  |
| Reward Loss         | -2.21e+07 |
| Running Env Steps   | 1365000   |
| Running Forward KL  | 20.2      |
| Running Reverse KL  | 9.91      |
| Running Update Time | 273       |
-----------------------------------
--2024-08-11 13:02:03.598878 UTC---
| Itration            | 274       |
| Real Det Return     | 7.77e+03  |
| Real Sto Return     | 6.92e+03  |
| Reward Loss         | -1.95e+07 |
| Running Env Steps   | 1370000   |
| Running Forward KL  | 19.9      |
| Running Reverse KL  | 9.88      |
| Running Update Time | 274       |
-----------------------------------
--2024-08-11 13:03:35.590253 UTC---
| Itration            | 275       |
| Real Det Return     | 8e+03     |
| Real Sto Return     | 7.09e+03  |
| Reward Loss         | -2.03e+07 |
| Running Env Steps   | 1375000   |
| Running Forward KL  | 19.4      |
| Running Reverse KL  | 9.76      |
| Running Update Time | 275       |
-----------------------------------
--2024-08-11 13:05:07.560153 UTC--
| Itration            | 276      |
| Real Det Return     | 8.1e+03  |
| Real Sto Return     | 7.25e+03 |
| Reward Loss         | -2.1e+07 |
| Running Env Steps   | 1380000  |
| Running Forward KL  | 20.5     |
| Running Reverse KL  | 10.4     |
| Running Update Time | 276      |
----------------------------------
--2024-08-11 13:06:39.161637 UTC---
| Itration            | 277       |
| Real Det Return     | 7.83e+03  |
| Real Sto Return     | 7.03e+03  |
| Reward Loss         | -2.03e+07 |
| Running Env Steps   | 1385000   |
| Running Forward KL  | 20.1      |
| Running Reverse KL  | 9.97      |
| Running Update Time | 277       |
-----------------------------------
--2024-08-11 13:08:11.987645 UTC---
| Itration            | 278       |
| Real Det Return     | 8.38e+03  |
| Real Sto Return     | 7.45e+03  |
| Reward Loss         | -1.94e+07 |
| Running Env Steps   | 1390000   |
| Running Forward KL  | 19.4      |
| Running Reverse KL  | 9.89      |
| Running Update Time | 278       |
-----------------------------------
--2024-08-11 13:09:43.416736 UTC---
| Itration            | 279       |
| Real Det Return     | 8.21e+03  |
| Real Sto Return     | 7.38e+03  |
| Reward Loss         | -1.91e+07 |
| Running Env Steps   | 1395000   |
| Running Forward KL  | 20        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 279       |
-----------------------------------
--2024-08-11 13:11:15.945388 UTC--
| Itration            | 280      |
| Real Det Return     | 7.98e+03 |
| Real Sto Return     | 7.21e+03 |
| Reward Loss         | -1.9e+07 |
| Running Env Steps   | 1400000  |
| Running Forward KL  | 19.5     |
| Running Reverse KL  | 9.93     |
| Running Update Time | 280      |
----------------------------------
--2024-08-11 13:12:49.313671 UTC---
| Itration            | 281       |
| Real Det Return     | 7.83e+03  |
| Real Sto Return     | 7.44e+03  |
| Reward Loss         | -1.97e+07 |
| Running Env Steps   | 1405000   |
| Running Forward KL  | 19.2      |
| Running Reverse KL  | 9.79      |
| Running Update Time | 281       |
-----------------------------------
--2024-08-11 13:14:20.159698 UTC---
| Itration            | 282       |
| Real Det Return     | 7.55e+03  |
| Real Sto Return     | 7.33e+03  |
| Reward Loss         | -1.95e+07 |
| Running Env Steps   | 1410000   |
| Running Forward KL  | 19.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 282       |
-----------------------------------
--2024-08-11 13:15:52.415630 UTC---
| Itration            | 283       |
| Real Det Return     | 8.55e+03  |
| Real Sto Return     | 7.39e+03  |
| Reward Loss         | -1.85e+07 |
| Running Env Steps   | 1415000   |
| Running Forward KL  | 19.4      |
| Running Reverse KL  | 9.99      |
| Running Update Time | 283       |
-----------------------------------
--2024-08-11 13:17:22.979020 UTC---
| Itration            | 284       |
| Real Det Return     | 8.7e+03   |
| Real Sto Return     | 7.57e+03  |
| Reward Loss         | -1.84e+07 |
| Running Env Steps   | 1420000   |
| Running Forward KL  | 19.4      |
| Running Reverse KL  | 9.99      |
| Running Update Time | 284       |
-----------------------------------
--2024-08-11 13:18:56.328082 UTC---
| Itration            | 285       |
| Real Det Return     | 8.05e+03  |
| Real Sto Return     | 7.47e+03  |
| Reward Loss         | -1.94e+07 |
| Running Env Steps   | 1425000   |
| Running Forward KL  | 19.4      |
| Running Reverse KL  | 9.94      |
| Running Update Time | 285       |
-----------------------------------
--2024-08-11 13:20:30.006771 UTC---
| Itration            | 286       |
| Real Det Return     | 8.87e+03  |
| Real Sto Return     | 7.94e+03  |
| Reward Loss         | -1.81e+07 |
| Running Env Steps   | 1430000   |
| Running Forward KL  | 19.1      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 286       |
-----------------------------------
--2024-08-11 13:22:02.419766 UTC---
| Itration            | 287       |
| Real Det Return     | 8.77e+03  |
| Real Sto Return     | 7.94e+03  |
| Reward Loss         | -1.68e+07 |
| Running Env Steps   | 1435000   |
| Running Forward KL  | 19.2      |
| Running Reverse KL  | 9.95      |
| Running Update Time | 287       |
-----------------------------------
--2024-08-11 13:23:34.646898 UTC---
| Itration            | 288       |
| Real Det Return     | 8.66e+03  |
| Real Sto Return     | 7.93e+03  |
| Reward Loss         | -1.63e+07 |
| Running Env Steps   | 1440000   |
| Running Forward KL  | 18.9      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 288       |
-----------------------------------
--2024-08-11 13:25:08.183611 UTC---
| Itration            | 289       |
| Real Det Return     | 8.57e+03  |
| Real Sto Return     | 7.37e+03  |
| Reward Loss         | -2.11e+07 |
| Running Env Steps   | 1445000   |
| Running Forward KL  | 19.6      |
| Running Reverse KL  | 9.86      |
| Running Update Time | 289       |
-----------------------------------
--2024-08-11 13:26:41.785335 UTC---
| Itration            | 290       |
| Real Det Return     | 8.68e+03  |
| Real Sto Return     | 8.01e+03  |
| Reward Loss         | -1.84e+07 |
| Running Env Steps   | 1450000   |
| Running Forward KL  | 19.2      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 290       |
-----------------------------------
--2024-08-11 13:28:17.895049 UTC--
| Itration            | 291      |
| Real Det Return     | 9.23e+03 |
| Real Sto Return     | 8.33e+03 |
| Reward Loss         | -1.7e+07 |
| Running Env Steps   | 1455000  |
| Running Forward KL  | 18.6     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 291      |
----------------------------------
--2024-08-11 13:29:49.560533 UTC---
| Itration            | 292       |
| Real Det Return     | 8.55e+03  |
| Real Sto Return     | 8.06e+03  |
| Reward Loss         | -1.77e+07 |
| Running Env Steps   | 1460000   |
| Running Forward KL  | 18.7      |
| Running Reverse KL  | 9.65      |
| Running Update Time | 292       |
-----------------------------------
--2024-08-11 13:31:23.310037 UTC---
| Itration            | 293       |
| Real Det Return     | 8.49e+03  |
| Real Sto Return     | 7.98e+03  |
| Reward Loss         | -1.89e+07 |
| Running Env Steps   | 1465000   |
| Running Forward KL  | 19.1      |
| Running Reverse KL  | 9.87      |
| Running Update Time | 293       |
-----------------------------------
--2024-08-11 13:32:57.775528 UTC--
| Itration            | 294      |
| Real Det Return     | 8.59e+03 |
| Real Sto Return     | 8.14e+03 |
| Reward Loss         | -1.6e+07 |
| Running Env Steps   | 1470000  |
| Running Forward KL  | 18.3     |
| Running Reverse KL  | 9.77     |
| Running Update Time | 294      |
----------------------------------
--2024-08-11 13:34:29.479833 UTC---
| Itration            | 295       |
| Real Det Return     | 8.9e+03   |
| Real Sto Return     | 8.28e+03  |
| Reward Loss         | -1.61e+07 |
| Running Env Steps   | 1475000   |
| Running Forward KL  | 18.3      |
| Running Reverse KL  | 9.92      |
| Running Update Time | 295       |
-----------------------------------
--2024-08-11 13:36:00.846953 UTC---
| Itration            | 296       |
| Real Det Return     | 8.69e+03  |
| Real Sto Return     | 8.11e+03  |
| Reward Loss         | -1.65e+07 |
| Running Env Steps   | 1480000   |
| Running Forward KL  | 18.9      |
| Running Reverse KL  | 10        |
| Running Update Time | 296       |
-----------------------------------
--2024-08-11 13:37:33.833121 UTC---
| Itration            | 297       |
| Real Det Return     | 9.01e+03  |
| Real Sto Return     | 8.39e+03  |
| Reward Loss         | -1.51e+07 |
| Running Env Steps   | 1485000   |
| Running Forward KL  | 18.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 297       |
-----------------------------------
--2024-08-11 13:39:08.739833 UTC---
| Itration            | 298       |
| Real Det Return     | 8.48e+03  |
| Real Sto Return     | 7.51e+03  |
| Reward Loss         | -1.88e+07 |
| Running Env Steps   | 1490000   |
| Running Forward KL  | 18.9      |
| Running Reverse KL  | 9.63      |
| Running Update Time | 298       |
-----------------------------------
--2024-08-11 13:40:42.256252 UTC---
| Itration            | 299       |
| Real Det Return     | 9.03e+03  |
| Real Sto Return     | 8.24e+03  |
| Reward Loss         | -1.58e+07 |
| Running Env Steps   | 1495000   |
| Running Forward KL  | 18.3      |
| Running Reverse KL  | 9.7       |
| Running Update Time | 299       |
-----------------------------------
--2024-08-11 13:42:13.779607 UTC---
| Itration            | 300       |
| Real Det Return     | 9.09e+03  |
| Real Sto Return     | 8.56e+03  |
| Reward Loss         | -1.61e+07 |
| Running Env Steps   | 1500000   |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 9.68      |
| Running Update Time | 300       |
-----------------------------------
--2024-08-11 13:43:45.869651 UTC---
| Itration            | 301       |
| Real Det Return     | 9.36e+03  |
| Real Sto Return     | 8.68e+03  |
| Reward Loss         | -1.51e+07 |
| Running Env Steps   | 1505000   |
| Running Forward KL  | 18.5      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 301       |
-----------------------------------
--2024-08-11 13:45:20.131756 UTC---
| Itration            | 302       |
| Real Det Return     | 9.46e+03  |
| Real Sto Return     | 8.65e+03  |
| Reward Loss         | -1.49e+07 |
| Running Env Steps   | 1510000   |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 302       |
-----------------------------------
--2024-08-11 13:46:52.074310 UTC--
| Itration            | 303      |
| Real Det Return     | 9.02e+03 |
| Real Sto Return     | 8.32e+03 |
| Reward Loss         | -1.6e+07 |
| Running Env Steps   | 1515000  |
| Running Forward KL  | 18.3     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 303      |
----------------------------------
--2024-08-11 13:48:27.090304 UTC---
| Itration            | 304       |
| Real Det Return     | 9.64e+03  |
| Real Sto Return     | 8.78e+03  |
| Reward Loss         | -1.38e+07 |
| Running Env Steps   | 1520000   |
| Running Forward KL  | 18.2      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 304       |
-----------------------------------
--2024-08-11 13:49:59.024951 UTC---
| Itration            | 305       |
| Real Det Return     | 9.31e+03  |
| Real Sto Return     | 8.35e+03  |
| Reward Loss         | -1.64e+07 |
| Running Env Steps   | 1525000   |
| Running Forward KL  | 18.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 305       |
-----------------------------------
--2024-08-11 13:51:33.234463 UTC---
| Itration            | 306       |
| Real Det Return     | 9.3e+03   |
| Real Sto Return     | 8.81e+03  |
| Reward Loss         | -1.41e+07 |
| Running Env Steps   | 1530000   |
| Running Forward KL  | 17.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 306       |
-----------------------------------
--2024-08-11 13:53:08.377302 UTC---
| Itration            | 307       |
| Real Det Return     | 9.44e+03  |
| Real Sto Return     | 8.38e+03  |
| Reward Loss         | -1.59e+07 |
| Running Env Steps   | 1535000   |
| Running Forward KL  | 18.7      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 307       |
-----------------------------------
--2024-08-11 13:54:41.579578 UTC---
| Itration            | 308       |
| Real Det Return     | 9.5e+03   |
| Real Sto Return     | 8.76e+03  |
| Reward Loss         | -1.54e+07 |
| Running Env Steps   | 1540000   |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 308       |
-----------------------------------
--2024-08-11 13:56:14.891727 UTC--
| Itration            | 309      |
| Real Det Return     | 9.98e+03 |
| Real Sto Return     | 8.75e+03 |
| Reward Loss         | -1.4e+07 |
| Running Env Steps   | 1545000  |
| Running Forward KL  | 17.8     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 309      |
----------------------------------
--2024-08-11 13:57:48.580756 UTC---
| Itration            | 310       |
| Real Det Return     | 9.55e+03  |
| Real Sto Return     | 9.11e+03  |
| Reward Loss         | -1.43e+07 |
| Running Env Steps   | 1550000   |
| Running Forward KL  | 17.4      |
| Running Reverse KL  | 9.85      |
| Running Update Time | 310       |
-----------------------------------
--2024-08-11 13:59:20.656638 UTC--
| Itration            | 311      |
| Real Det Return     | 9.88e+03 |
| Real Sto Return     | 9.2e+03  |
| Reward Loss         | -1.3e+07 |
| Running Env Steps   | 1555000  |
| Running Forward KL  | 17.6     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 311      |
----------------------------------
--2024-08-11 14:00:55.034338 UTC---
| Itration            | 312       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.54e+03  |
| Reward Loss         | -1.23e+07 |
| Running Env Steps   | 1560000   |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 312       |
-----------------------------------
--2024-08-11 14:02:26.997170 UTC---
| Itration            | 313       |
| Real Det Return     | 1.05e+04  |
| Real Sto Return     | 8.8e+03   |
| Reward Loss         | -1.37e+07 |
| Running Env Steps   | 1565000   |
| Running Forward KL  | 17        |
| Running Reverse KL  | 10.2      |
| Running Update Time | 313       |
-----------------------------------
--2024-08-11 14:04:00.752137 UTC---
| Itration            | 314       |
| Real Det Return     | 9.99e+03  |
| Real Sto Return     | 9.22e+03  |
| Reward Loss         | -1.39e+07 |
| Running Env Steps   | 1570000   |
| Running Forward KL  | 17.9      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 314       |
-----------------------------------
--2024-08-11 14:05:35.346990 UTC---
| Itration            | 315       |
| Real Det Return     | 1.04e+04  |
| Real Sto Return     | 9.44e+03  |
| Reward Loss         | -1.18e+07 |
| Running Env Steps   | 1575000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 315       |
-----------------------------------
--2024-08-11 14:07:08.157506 UTC--
| Itration            | 316      |
| Real Det Return     | 1.01e+04 |
| Real Sto Return     | 9.33e+03 |
| Reward Loss         | -1.5e+07 |
| Running Env Steps   | 1580000  |
| Running Forward KL  | 17.7     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 316      |
----------------------------------
--2024-08-11 14:08:41.576547 UTC---
| Itration            | 317       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.7e+03   |
| Reward Loss         | -1.27e+07 |
| Running Env Steps   | 1585000   |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 317       |
-----------------------------------
--2024-08-11 14:10:15.353584 UTC---
| Itration            | 318       |
| Real Det Return     | 9.77e+03  |
| Real Sto Return     | 9.06e+03  |
| Reward Loss         | -1.37e+07 |
| Running Env Steps   | 1590000   |
| Running Forward KL  | 18.1      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 318       |
-----------------------------------
--2024-08-11 14:11:47.750160 UTC---
| Itration            | 319       |
| Real Det Return     | 1.05e+04  |
| Real Sto Return     | 9.43e+03  |
| Reward Loss         | -1.23e+07 |
| Running Env Steps   | 1595000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 319       |
-----------------------------------
--2024-08-11 14:13:22.355197 UTC---
| Itration            | 320       |
| Real Det Return     | 1.04e+04  |
| Real Sto Return     | 9.45e+03  |
| Reward Loss         | -1.19e+07 |
| Running Env Steps   | 1600000   |
| Running Forward KL  | 17.8      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 320       |
-----------------------------------
--2024-08-11 14:14:53.852329 UTC---
| Itration            | 321       |
| Real Det Return     | 9.66e+03  |
| Real Sto Return     | 9.21e+03  |
| Reward Loss         | -1.37e+07 |
| Running Env Steps   | 1605000   |
| Running Forward KL  | 17        |
| Running Reverse KL  | 9.58      |
| Running Update Time | 321       |
-----------------------------------
--2024-08-11 14:16:28.629876 UTC---
| Itration            | 322       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.86e+03  |
| Reward Loss         | -1.14e+07 |
| Running Env Steps   | 1610000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 322       |
-----------------------------------
--2024-08-11 14:18:02.945820 UTC---
| Itration            | 323       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.6e+03   |
| Reward Loss         | -1.11e+07 |
| Running Env Steps   | 1615000   |
| Running Forward KL  | 16.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 323       |
-----------------------------------
--2024-08-11 14:19:35.178328 UTC---
| Itration            | 324       |
| Real Det Return     | 1.02e+04  |
| Real Sto Return     | 9.63e+03  |
| Reward Loss         | -1.44e+07 |
| Running Env Steps   | 1620000   |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 324       |
-----------------------------------
--2024-08-11 14:21:08.206751 UTC---
| Itration            | 325       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 9.81e+03  |
| Reward Loss         | -1.17e+07 |
| Running Env Steps   | 1625000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 325       |
-----------------------------------
--2024-08-11 14:22:42.746339 UTC--
| Itration            | 326      |
| Real Det Return     | 1.05e+04 |
| Real Sto Return     | 9.85e+03 |
| Reward Loss         | -1.1e+07 |
| Running Env Steps   | 1630000  |
| Running Forward KL  | 16.8     |
| Running Reverse KL  | 10       |
| Running Update Time | 326      |
----------------------------------
--2024-08-11 14:24:14.564132 UTC---
| Itration            | 327       |
| Real Det Return     | 1.02e+04  |
| Real Sto Return     | 9.41e+03  |
| Reward Loss         | -1.27e+07 |
| Running Env Steps   | 1635000   |
| Running Forward KL  | 17.5      |
| Running Reverse KL  | 12        |
| Running Update Time | 327       |
-----------------------------------
--2024-08-11 14:25:48.879760 UTC---
| Itration            | 328       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 9.92e+03  |
| Reward Loss         | -1.23e+07 |
| Running Env Steps   | 1640000   |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 10        |
| Running Update Time | 328       |
-----------------------------------
--2024-08-11 14:27:20.773495 UTC---
| Itration            | 329       |
| Real Det Return     | 1.01e+04  |
| Real Sto Return     | 9.74e+03  |
| Reward Loss         | -1.22e+07 |
| Running Env Steps   | 1645000   |
| Running Forward KL  | 16.9      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 329       |
-----------------------------------
--2024-08-11 14:28:54.259568 UTC---
| Itration            | 330       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.69e+03  |
| Reward Loss         | -1.05e+07 |
| Running Env Steps   | 1650000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 330       |
-----------------------------------
--2024-08-11 14:30:31.809107 UTC---
| Itration            | 331       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 9.73e+03  |
| Reward Loss         | -1.03e+07 |
| Running Env Steps   | 1655000   |
| Running Forward KL  | 16.9      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 331       |
-----------------------------------
--2024-08-11 14:32:04.973263 UTC---
| Itration            | 332       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 1e+04     |
| Reward Loss         | -1.03e+07 |
| Running Env Steps   | 1660000   |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 332       |
-----------------------------------
--2024-08-11 14:33:37.570043 UTC---
| Itration            | 333       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 9.97e+03  |
| Reward Loss         | -1.11e+07 |
| Running Env Steps   | 1665000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 333       |
-----------------------------------
--2024-08-11 14:35:11.838117 UTC---
| Itration            | 334       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 9.98e+03  |
| Reward Loss         | -1.07e+07 |
| Running Env Steps   | 1670000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 334       |
-----------------------------------
--2024-08-11 14:36:43.558255 UTC---
| Itration            | 335       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 9.55e+03  |
| Reward Loss         | -1.09e+07 |
| Running Env Steps   | 1675000   |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 335       |
-----------------------------------
--2024-08-11 14:38:17.323602 UTC---
| Itration            | 336       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -1.04e+07 |
| Running Env Steps   | 1680000   |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 336       |
-----------------------------------
--2024-08-11 14:39:50.448644 UTC---
| Itration            | 337       |
| Real Det Return     | 9.94e+03  |
| Real Sto Return     | 9.43e+03  |
| Reward Loss         | -1.39e+07 |
| Running Env Steps   | 1685000   |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 337       |
-----------------------------------
--2024-08-11 14:41:25.192478 UTC---
| Itration            | 338       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 9.99e+03  |
| Reward Loss         | -1.08e+07 |
| Running Env Steps   | 1690000   |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 338       |
-----------------------------------
--2024-08-11 14:42:59.408805 UTC---
| Itration            | 339       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -1.07e+07 |
| Running Env Steps   | 1695000   |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 339       |
-----------------------------------
--2024-08-11 14:44:32.432546 UTC---
| Itration            | 340       |
| Real Det Return     | 1.12e+04  |
| Real Sto Return     | 1.03e+04  |
| Reward Loss         | -1.01e+07 |
| Running Env Steps   | 1700000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 340       |
-----------------------------------
--2024-08-11 14:46:06.942299 UTC---
| Itration            | 341       |
| Real Det Return     | 1.07e+04  |
| Real Sto Return     | 9.62e+03  |
| Reward Loss         | -1.06e+07 |
| Running Env Steps   | 1705000   |
| Running Forward KL  | 16.2      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 341       |
-----------------------------------
--2024-08-11 14:47:43.110835 UTC---
| Itration            | 342       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -9.66e+06 |
| Running Env Steps   | 1710000   |
| Running Forward KL  | 16.3      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 342       |
-----------------------------------
--2024-08-11 14:49:14.820437 UTC---
| Itration            | 343       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 9.72e+03  |
| Reward Loss         | -1.02e+07 |
| Running Env Steps   | 1715000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 343       |
-----------------------------------
--2024-08-11 14:50:48.861839 UTC---
| Itration            | 344       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -1.18e+07 |
| Running Env Steps   | 1720000   |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 9.89      |
| Running Update Time | 344       |
-----------------------------------
--2024-08-11 14:52:21.997081 UTC---
| Itration            | 345       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -9.45e+06 |
| Running Env Steps   | 1725000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 11        |
| Running Update Time | 345       |
-----------------------------------
--2024-08-11 14:53:55.041294 UTC---
| Itration            | 346       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 9.65e+03  |
| Reward Loss         | -1.07e+07 |
| Running Env Steps   | 1730000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 346       |
-----------------------------------
--2024-08-11 14:55:28.723149 UTC---
| Itration            | 347       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.01e+04  |
| Reward Loss         | -9.89e+06 |
| Running Env Steps   | 1735000   |
| Running Forward KL  | 16.9      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 347       |
-----------------------------------
--2024-08-11 14:57:00.602506 UTC---
| Itration            | 348       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 9.97e+03  |
| Reward Loss         | -1.03e+07 |
| Running Env Steps   | 1740000   |
| Running Forward KL  | 17.2      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 348       |
-----------------------------------
--2024-08-11 14:58:33.786485 UTC---
| Itration            | 349       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.01e+04  |
| Reward Loss         | -1.27e+07 |
| Running Env Steps   | 1745000   |
| Running Forward KL  | 16.4      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 349       |
-----------------------------------
--2024-08-11 15:00:06.571387 UTC---
| Itration            | 350       |
| Real Det Return     | 9.82e+03  |
| Real Sto Return     | 9.58e+03  |
| Reward Loss         | -1.26e+07 |
| Running Env Steps   | 1750000   |
| Running Forward KL  | 16.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 350       |
-----------------------------------
--2024-08-11 15:01:37.298356 UTC---
| Itration            | 351       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -8.57e+06 |
| Running Env Steps   | 1755000   |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 11        |
| Running Update Time | 351       |
-----------------------------------
--2024-08-11 15:03:10.154278 UTC---
| Itration            | 352       |
| Real Det Return     | 1.07e+04  |
| Real Sto Return     | 9.99e+03  |
| Reward Loss         | -9.22e+06 |
| Running Env Steps   | 1760000   |
| Running Forward KL  | 16.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 352       |
-----------------------------------
--2024-08-11 15:04:42.242947 UTC---
| Itration            | 353       |
| Real Det Return     | 1.04e+04  |
| Real Sto Return     | 9.9e+03   |
| Reward Loss         | -1.22e+07 |
| Running Env Steps   | 1765000   |
| Running Forward KL  | 17.3      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 353       |
-----------------------------------
--2024-08-11 15:06:16.491966 UTC---
| Itration            | 354       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -9.68e+06 |
| Running Env Steps   | 1770000   |
| Running Forward KL  | 16.5      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 354       |
-----------------------------------
--2024-08-11 15:07:50.000791 UTC---
| Itration            | 355       |
| Real Det Return     | 1.12e+04  |
| Real Sto Return     | 1.01e+04  |
| Reward Loss         | -1.13e+07 |
| Running Env Steps   | 1775000   |
| Running Forward KL  | 16.2      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 355       |
-----------------------------------
--2024-08-11 15:09:21.795472 UTC---
| Itration            | 356       |
| Real Det Return     | 1.03e+04  |
| Real Sto Return     | 9.81e+03  |
| Reward Loss         | -1.12e+07 |
| Running Env Steps   | 1780000   |
| Running Forward KL  | 17.1      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 356       |
-----------------------------------
--2024-08-11 15:10:53.965022 UTC---
| Itration            | 357       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -8.99e+06 |
| Running Env Steps   | 1785000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 357       |
-----------------------------------
--2024-08-11 15:12:27.116167 UTC---
| Itration            | 358       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.03e+04  |
| Reward Loss         | -9.51e+06 |
| Running Env Steps   | 1790000   |
| Running Forward KL  | 16.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 358       |
-----------------------------------
--2024-08-11 15:13:59.135724 UTC---
| Itration            | 359       |
| Real Det Return     | 1.12e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -8.54e+06 |
| Running Env Steps   | 1795000   |
| Running Forward KL  | 15.9      |
| Running Reverse KL  | 9.96      |
| Running Update Time | 359       |
-----------------------------------
--2024-08-11 15:15:32.097910 UTC---
| Itration            | 360       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -1.01e+07 |
| Running Env Steps   | 1800000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 9.68      |
| Running Update Time | 360       |
-----------------------------------
--2024-08-11 15:17:02.676359 UTC---
| Itration            | 361       |
| Real Det Return     | 1.09e+04  |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -9.84e+06 |
| Running Env Steps   | 1805000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 361       |
-----------------------------------
--2024-08-11 15:18:36.226085 UTC---
| Itration            | 362       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.03e+04  |
| Reward Loss         | -8.15e+06 |
| Running Env Steps   | 1810000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 362       |
-----------------------------------
--2024-08-11 15:20:09.706777 UTC---
| Itration            | 363       |
| Real Det Return     | 1.14e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -8.83e+06 |
| Running Env Steps   | 1815000   |
| Running Forward KL  | 16        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 363       |
-----------------------------------
--2024-08-11 15:21:42.079755 UTC---
| Itration            | 364       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.07e+04  |
| Reward Loss         | -8.65e+06 |
| Running Env Steps   | 1820000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 364       |
-----------------------------------
--2024-08-11 15:23:14.834627 UTC---
| Itration            | 365       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -9.59e+06 |
| Running Env Steps   | 1825000   |
| Running Forward KL  | 15.9      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 365       |
-----------------------------------
--2024-08-11 15:24:47.073052 UTC--
| Itration            | 366      |
| Real Det Return     | 1.08e+04 |
| Real Sto Return     | 1.03e+04 |
| Reward Loss         | -9.7e+06 |
| Running Env Steps   | 1830000  |
| Running Forward KL  | 16.2     |
| Running Reverse KL  | 11       |
| Running Update Time | 366      |
----------------------------------
--2024-08-11 15:26:18.753877 UTC--
| Itration            | 367      |
| Real Det Return     | 1.07e+04 |
| Real Sto Return     | 1e+04    |
| Reward Loss         | -9.9e+06 |
| Running Env Steps   | 1835000  |
| Running Forward KL  | 16.3     |
| Running Reverse KL  | 10       |
| Running Update Time | 367      |
----------------------------------
--2024-08-11 15:27:52.632488 UTC---
| Itration            | 368       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1e+04     |
| Reward Loss         | -8.88e+06 |
| Running Env Steps   | 1840000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 368       |
-----------------------------------
--2024-08-11 15:29:23.616135 UTC--
| Itration            | 369      |
| Real Det Return     | 1.11e+04 |
| Real Sto Return     | 1.07e+04 |
| Reward Loss         | -7.9e+06 |
| Running Env Steps   | 1845000  |
| Running Forward KL  | 16       |
| Running Reverse KL  | 10.7     |
| Running Update Time | 369      |
----------------------------------
--2024-08-11 15:30:57.212260 UTC---
| Itration            | 370       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.08e+04  |
| Reward Loss         | -7.71e+06 |
| Running Env Steps   | 1850000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 370       |
-----------------------------------
--2024-08-11 15:32:30.489634 UTC---
| Itration            | 371       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -8.59e+06 |
| Running Env Steps   | 1855000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 371       |
-----------------------------------
--2024-08-11 15:34:02.468010 UTC---
| Itration            | 372       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -8.55e+06 |
| Running Env Steps   | 1860000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 11        |
| Running Update Time | 372       |
-----------------------------------
--2024-08-11 15:35:35.650965 UTC--
| Itration            | 373      |
| Real Det Return     | 1.14e+04 |
| Real Sto Return     | 1.07e+04 |
| Reward Loss         | -9.2e+06 |
| Running Env Steps   | 1865000  |
| Running Forward KL  | 15.6     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 373      |
----------------------------------
--2024-08-11 15:37:07.120754 UTC---
| Itration            | 374       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1e+04     |
| Reward Loss         | -1.01e+07 |
| Running Env Steps   | 1870000   |
| Running Forward KL  | 16.2      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 374       |
-----------------------------------
--2024-08-11 15:38:40.769488 UTC---
| Itration            | 375       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.07e+04  |
| Reward Loss         | -8.12e+06 |
| Running Env Steps   | 1875000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 375       |
-----------------------------------
--2024-08-11 15:40:14.182293 UTC---
| Itration            | 376       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -9.14e+06 |
| Running Env Steps   | 1880000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 376       |
-----------------------------------
--2024-08-11 15:41:46.247408 UTC---
| Itration            | 377       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -1.05e+07 |
| Running Env Steps   | 1885000   |
| Running Forward KL  | 16.3      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 377       |
-----------------------------------
--2024-08-11 15:43:18.913789 UTC--
| Itration            | 378      |
| Real Det Return     | 1.15e+04 |
| Real Sto Return     | 1.09e+04 |
| Reward Loss         | -9.9e+06 |
| Running Env Steps   | 1890000  |
| Running Forward KL  | 15.7     |
| Running Reverse KL  | 9.91     |
| Running Update Time | 378      |
----------------------------------
--2024-08-11 15:44:52.570797 UTC---
| Itration            | 379       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -8.45e+06 |
| Running Env Steps   | 1895000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 379       |
-----------------------------------
--2024-08-11 15:46:23.734837 UTC---
| Itration            | 380       |
| Real Det Return     | 1.14e+04  |
| Real Sto Return     | 1.08e+04  |
| Reward Loss         | -8.77e+06 |
| Running Env Steps   | 1900000   |
| Running Forward KL  | 15.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 380       |
-----------------------------------
--2024-08-11 15:47:57.233996 UTC---
| Itration            | 381       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -9.26e+06 |
| Running Env Steps   | 1905000   |
| Running Forward KL  | 16        |
| Running Reverse KL  | 10.6      |
| Running Update Time | 381       |
-----------------------------------
--2024-08-11 15:49:29.066741 UTC---
| Itration            | 382       |
| Real Det Return     | 1.16e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -7.77e+06 |
| Running Env Steps   | 1910000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 382       |
-----------------------------------
--2024-08-11 15:51:03.800289 UTC---
| Itration            | 383       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -6.67e+06 |
| Running Env Steps   | 1915000   |
| Running Forward KL  | 15.4      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 383       |
-----------------------------------
--2024-08-11 15:52:37.740499 UTC---
| Itration            | 384       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.08e+04  |
| Reward Loss         | -6.67e+06 |
| Running Env Steps   | 1920000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 384       |
-----------------------------------
--2024-08-11 15:54:10.014776 UTC---
| Itration            | 385       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -9.59e+06 |
| Running Env Steps   | 1925000   |
| Running Forward KL  | 16.3      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 385       |
-----------------------------------
--2024-08-11 15:55:42.306034 UTC---
| Itration            | 386       |
| Real Det Return     | 1.14e+04  |
| Real Sto Return     | 9.84e+03  |
| Reward Loss         | -7.67e+06 |
| Running Env Steps   | 1930000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 386       |
-----------------------------------
--2024-08-11 15:57:15.853384 UTC---
| Itration            | 387       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 9.7e+03   |
| Reward Loss         | -8.11e+06 |
| Running Env Steps   | 1935000   |
| Running Forward KL  | 15.8      |
| Running Reverse KL  | 9.84      |
| Running Update Time | 387       |
-----------------------------------
--2024-08-11 15:58:48.214903 UTC---
| Itration            | 388       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.87e+06 |
| Running Env Steps   | 1940000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 388       |
-----------------------------------
--2024-08-11 16:00:22.635260 UTC---
| Itration            | 389       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.91e+06 |
| Running Env Steps   | 1945000   |
| Running Forward KL  | 15.5      |
| Running Reverse KL  | 9.98      |
| Running Update Time | 389       |
-----------------------------------
--2024-08-11 16:01:53.135966 UTC---
| Itration            | 390       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.62e+06 |
| Running Env Steps   | 1950000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 390       |
-----------------------------------
--2024-08-11 16:03:27.383757 UTC---
| Itration            | 391       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -6.27e+06 |
| Running Env Steps   | 1955000   |
| Running Forward KL  | 15.5      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 391       |
-----------------------------------
--2024-08-11 16:05:00.685627 UTC---
| Itration            | 392       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.92e+06 |
| Running Env Steps   | 1960000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 392       |
-----------------------------------
--2024-08-11 16:06:32.391188 UTC---
| Itration            | 393       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -7.15e+06 |
| Running Env Steps   | 1965000   |
| Running Forward KL  | 15.5      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 393       |
-----------------------------------
--2024-08-11 16:08:04.405357 UTC---
| Itration            | 394       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -7.65e+06 |
| Running Env Steps   | 1970000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 394       |
-----------------------------------
--2024-08-11 16:09:37.222574 UTC---
| Itration            | 395       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -8.99e+06 |
| Running Env Steps   | 1975000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 395       |
-----------------------------------
--2024-08-11 16:11:09.600110 UTC---
| Itration            | 396       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -7.74e+06 |
| Running Env Steps   | 1980000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 396       |
-----------------------------------
--2024-08-11 16:12:43.495439 UTC---
| Itration            | 397       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.76e+06 |
| Running Env Steps   | 1985000   |
| Running Forward KL  | 15.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 397       |
-----------------------------------
--2024-08-11 16:14:14.481555 UTC---
| Itration            | 398       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -9.43e+06 |
| Running Env Steps   | 1990000   |
| Running Forward KL  | 16.1      |
| Running Reverse KL  | 11        |
| Running Update Time | 398       |
-----------------------------------
--2024-08-11 16:15:48.200799 UTC--
| Itration            | 399      |
| Real Det Return     | 1.14e+04 |
| Real Sto Return     | 1.12e+04 |
| Reward Loss         | -8e+06   |
| Running Env Steps   | 1995000  |
| Running Forward KL  | 15.2     |
| Running Reverse KL  | 9.87     |
| Running Update Time | 399      |
----------------------------------
--2024-08-11 16:17:21.930714 UTC---
| Itration            | 400       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.41e+06 |
| Running Env Steps   | 2000000   |
| Running Forward KL  | 15.3      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 400       |
-----------------------------------
--2024-08-11 16:18:53.403527 UTC---
| Itration            | 401       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.62e+06 |
| Running Env Steps   | 2005000   |
| Running Forward KL  | 15.3      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 401       |
-----------------------------------
--2024-08-11 16:20:26.580041 UTC---
| Itration            | 402       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.09e+04  |
| Reward Loss         | -8.25e+06 |
| Running Env Steps   | 2010000   |
| Running Forward KL  | 15.3      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 402       |
-----------------------------------
--2024-08-11 16:21:58.206844 UTC---
| Itration            | 403       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.22e+06 |
| Running Env Steps   | 2015000   |
| Running Forward KL  | 15.2      |
| Running Reverse KL  | 10        |
| Running Update Time | 403       |
-----------------------------------
--2024-08-11 16:23:30.715347 UTC---
| Itration            | 404       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.95e+06 |
| Running Env Steps   | 2020000   |
| Running Forward KL  | 15.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 404       |
-----------------------------------
--2024-08-11 16:25:04.522939 UTC---
| Itration            | 405       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.16e+06 |
| Running Env Steps   | 2025000   |
| Running Forward KL  | 15.5      |
| Running Reverse KL  | 11        |
| Running Update Time | 405       |
-----------------------------------
--2024-08-11 16:26:36.144224 UTC---
| Itration            | 406       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -5.91e+06 |
| Running Env Steps   | 2030000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 406       |
-----------------------------------
--2024-08-11 16:28:09.770556 UTC--
| Itration            | 407      |
| Real Det Return     | 1.18e+04 |
| Real Sto Return     | 1.12e+04 |
| Reward Loss         | -7.9e+06 |
| Running Env Steps   | 2035000  |
| Running Forward KL  | 15.3     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 407      |
----------------------------------
--2024-08-11 16:29:43.922008 UTC--
| Itration            | 408      |
| Real Det Return     | 1.17e+04 |
| Real Sto Return     | 1.1e+04  |
| Reward Loss         | -6.7e+06 |
| Running Env Steps   | 2040000  |
| Running Forward KL  | 15.6     |
| Running Reverse KL  | 11       |
| Running Update Time | 408      |
----------------------------------
--2024-08-11 16:31:16.079397 UTC---
| Itration            | 409       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -7.36e+06 |
| Running Env Steps   | 2045000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 409       |
-----------------------------------
--2024-08-11 16:32:48.435768 UTC---
| Itration            | 410       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.33e+06 |
| Running Env Steps   | 2050000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 410       |
-----------------------------------
--2024-08-11 16:34:20.023644 UTC---
| Itration            | 411       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -7.17e+06 |
| Running Env Steps   | 2055000   |
| Running Forward KL  | 15.5      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 411       |
-----------------------------------
--2024-08-11 16:35:52.546203 UTC---
| Itration            | 412       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.76e+06 |
| Running Env Steps   | 2060000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.2      |
| Running Update Time | 412       |
-----------------------------------
--2024-08-11 16:37:26.709872 UTC---
| Itration            | 413       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -5.91e+06 |
| Running Env Steps   | 2065000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 413       |
-----------------------------------
--2024-08-11 16:38:58.124985 UTC---
| Itration            | 414       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -7.64e+06 |
| Running Env Steps   | 2070000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 9.85      |
| Running Update Time | 414       |
-----------------------------------
--2024-08-11 16:40:31.681613 UTC---
| Itration            | 415       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -7.93e+06 |
| Running Env Steps   | 2075000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 415       |
-----------------------------------
--2024-08-11 16:42:05.111552 UTC---
| Itration            | 416       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.75e+06 |
| Running Env Steps   | 2080000   |
| Running Forward KL  | 15.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 416       |
-----------------------------------
--2024-08-11 16:43:36.341314 UTC---
| Itration            | 417       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -1.03e+07 |
| Running Env Steps   | 2085000   |
| Running Forward KL  | 16.2      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 417       |
-----------------------------------
--2024-08-11 16:45:09.321717 UTC---
| Itration            | 418       |
| Real Det Return     | 1.08e+04  |
| Real Sto Return     | 1.03e+04  |
| Reward Loss         | -7.07e+06 |
| Running Env Steps   | 2090000   |
| Running Forward KL  | 14.6      |
| Running Reverse KL  | 9.9       |
| Running Update Time | 418       |
-----------------------------------
--2024-08-11 16:46:41.763163 UTC---
| Itration            | 419       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.05e+06 |
| Running Env Steps   | 2095000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 419       |
-----------------------------------
--2024-08-11 16:48:15.537996 UTC---
| Itration            | 420       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.41e+06 |
| Running Env Steps   | 2100000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 420       |
-----------------------------------
--2024-08-11 16:49:49.504463 UTC---
| Itration            | 421       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.96e+06 |
| Running Env Steps   | 2105000   |
| Running Forward KL  | 14.6      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 421       |
-----------------------------------
--2024-08-11 16:51:21.103609 UTC---
| Itration            | 422       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.33e+06 |
| Running Env Steps   | 2110000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 9.93      |
| Running Update Time | 422       |
-----------------------------------
--2024-08-11 16:52:55.062249 UTC---
| Itration            | 423       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -8.81e+06 |
| Running Env Steps   | 2115000   |
| Running Forward KL  | 15.3      |
| Running Reverse KL  | 9.59      |
| Running Update Time | 423       |
-----------------------------------
--2024-08-11 16:54:28.628859 UTC---
| Itration            | 424       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.68e+06 |
| Running Env Steps   | 2120000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 424       |
-----------------------------------
--2024-08-11 16:56:00.459144 UTC---
| Itration            | 425       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.25e+06 |
| Running Env Steps   | 2125000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 9.58      |
| Running Update Time | 425       |
-----------------------------------
--2024-08-11 16:57:33.211093 UTC---
| Itration            | 426       |
| Real Det Return     | 1.16e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -7.52e+06 |
| Running Env Steps   | 2130000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 426       |
-----------------------------------
--2024-08-11 16:59:05.429223 UTC---
| Itration            | 427       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.08e+06 |
| Running Env Steps   | 2135000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 427       |
-----------------------------------
--2024-08-11 17:00:38.088564 UTC---
| Itration            | 428       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -6.62e+06 |
| Running Env Steps   | 2140000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 428       |
-----------------------------------
--2024-08-11 17:02:12.658935 UTC---
| Itration            | 429       |
| Real Det Return     | 1.11e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.29e+06 |
| Running Env Steps   | 2145000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 429       |
-----------------------------------
--2024-08-11 17:03:43.141195 UTC---
| Itration            | 430       |
| Real Det Return     | 1.07e+04  |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -9.86e+06 |
| Running Env Steps   | 2150000   |
| Running Forward KL  | 15.7      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 430       |
-----------------------------------
--2024-08-11 17:05:16.936262 UTC---
| Itration            | 431       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.31e+06 |
| Running Env Steps   | 2155000   |
| Running Forward KL  | 14.7      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 431       |
-----------------------------------
--2024-08-11 17:06:50.565814 UTC--
| Itration            | 432      |
| Real Det Return     | 1.08e+04 |
| Real Sto Return     | 1.14e+04 |
| Reward Loss         | -6.7e+06 |
| Running Env Steps   | 2160000  |
| Running Forward KL  | 15.1     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 432      |
----------------------------------
--2024-08-11 17:08:22.243046 UTC---
| Itration            | 433       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -5.82e+06 |
| Running Env Steps   | 2165000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 433       |
-----------------------------------
--2024-08-11 17:09:54.742795 UTC--
| Itration            | 434      |
| Real Det Return     | 1.15e+04 |
| Real Sto Return     | 1.12e+04 |
| Reward Loss         | -9.7e+06 |
| Running Env Steps   | 2170000  |
| Running Forward KL  | 15       |
| Running Reverse KL  | 9.88     |
| Running Update Time | 434      |
----------------------------------
--2024-08-11 17:11:26.926622 UTC---
| Itration            | 435       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -7.13e+06 |
| Running Env Steps   | 2175000   |
| Running Forward KL  | 15.2      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 435       |
-----------------------------------
--2024-08-11 17:12:58.829330 UTC---
| Itration            | 436       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.96e+06 |
| Running Env Steps   | 2180000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 436       |
-----------------------------------
--2024-08-11 17:14:32.764621 UTC--
| Itration            | 437      |
| Real Det Return     | 1.17e+04 |
| Real Sto Return     | 1.1e+04  |
| Reward Loss         | -7.4e+06 |
| Running Env Steps   | 2185000  |
| Running Forward KL  | 15.4     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 437      |
----------------------------------
--2024-08-11 17:16:03.224859 UTC---
| Itration            | 438       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -6.48e+06 |
| Running Env Steps   | 2190000   |
| Running Forward KL  | 14.6      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 438       |
-----------------------------------
--2024-08-11 17:17:37.118281 UTC---
| Itration            | 439       |
| Real Det Return     | 1.12e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -1.62e+07 |
| Running Env Steps   | 2195000   |
| Running Forward KL  | 15        |
| Running Reverse KL  | 9.51      |
| Running Update Time | 439       |
-----------------------------------
--2024-08-11 17:19:10.784112 UTC---
| Itration            | 440       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -5.71e+06 |
| Running Env Steps   | 2200000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 440       |
-----------------------------------
--2024-08-11 17:20:42.509450 UTC---
| Itration            | 441       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.44e+06 |
| Running Env Steps   | 2205000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 441       |
-----------------------------------
--2024-08-11 17:22:14.520565 UTC---
| Itration            | 442       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.53e+06 |
| Running Env Steps   | 2210000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 9.99      |
| Running Update Time | 442       |
-----------------------------------
--2024-08-11 17:23:46.200541 UTC---
| Itration            | 443       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.85e+06 |
| Running Env Steps   | 2215000   |
| Running Forward KL  | 15.4      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 443       |
-----------------------------------
--2024-08-11 17:25:18.009792 UTC---
| Itration            | 444       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -5.38e+06 |
| Running Env Steps   | 2220000   |
| Running Forward KL  | 14.6      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 444       |
-----------------------------------
--2024-08-11 17:26:51.658088 UTC---
| Itration            | 445       |
| Real Det Return     | 1.16e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.52e+06 |
| Running Env Steps   | 2225000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 445       |
-----------------------------------
--2024-08-11 17:28:21.797985 UTC--
| Itration            | 446      |
| Real Det Return     | 1.1e+04  |
| Real Sto Return     | 1.11e+04 |
| Reward Loss         | -8.7e+06 |
| Running Env Steps   | 2230000  |
| Running Forward KL  | 14.5     |
| Running Reverse KL  | 9.63     |
| Running Update Time | 446      |
----------------------------------
--2024-08-11 17:29:55.708953 UTC---
| Itration            | 447       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.93e+06 |
| Running Env Steps   | 2235000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 9.72      |
| Running Update Time | 447       |
-----------------------------------
--2024-08-11 17:31:28.573419 UTC---
| Itration            | 448       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.28e+06 |
| Running Env Steps   | 2240000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 448       |
-----------------------------------
--2024-08-11 17:33:00.071954 UTC---
| Itration            | 449       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.23e+06 |
| Running Env Steps   | 2245000   |
| Running Forward KL  | 14.9      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 449       |
-----------------------------------
--2024-08-11 17:34:32.428582 UTC---
| Itration            | 450       |
| Real Det Return     | 1.16e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -5.98e+06 |
| Running Env Steps   | 2250000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 450       |
-----------------------------------
--2024-08-11 17:36:04.403481 UTC---
| Itration            | 451       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -8.17e+06 |
| Running Env Steps   | 2255000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 9.21      |
| Running Update Time | 451       |
-----------------------------------
--2024-08-11 17:37:35.773913 UTC--
| Itration            | 452      |
| Real Det Return     | 1.23e+04 |
| Real Sto Return     | 1.16e+04 |
| Reward Loss         | -5.6e+06 |
| Running Env Steps   | 2260000  |
| Running Forward KL  | 14.4     |
| Running Reverse KL  | 9.64     |
| Running Update Time | 452      |
----------------------------------
--2024-08-11 17:39:09.545250 UTC---
| Itration            | 453       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.69e+06 |
| Running Env Steps   | 2265000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 9.86      |
| Running Update Time | 453       |
-----------------------------------
--2024-08-11 17:40:39.805406 UTC---
| Itration            | 454       |
| Real Det Return     | 1.17e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.88e+06 |
| Running Env Steps   | 2270000   |
| Running Forward KL  | 15.1      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 454       |
-----------------------------------
--2024-08-11 17:42:13.553071 UTC---
| Itration            | 455       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -4.41e+06 |
| Running Env Steps   | 2275000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.93      |
| Running Update Time | 455       |
-----------------------------------
--2024-08-11 17:43:46.069815 UTC---
| Itration            | 456       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.01e+06 |
| Running Env Steps   | 2280000   |
| Running Forward KL  | 14.7      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 456       |
-----------------------------------
--2024-08-11 17:45:17.927386 UTC---
| Itration            | 457       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -6.57e+06 |
| Running Env Steps   | 2285000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 457       |
-----------------------------------
--2024-08-11 17:46:50.431122 UTC--
| Itration            | 458      |
| Real Det Return     | 1.18e+04 |
| Real Sto Return     | 1.08e+04 |
| Reward Loss         | -7.1e+06 |
| Running Env Steps   | 2290000  |
| Running Forward KL  | 14.3     |
| Running Reverse KL  | 9.47     |
| Running Update Time | 458      |
----------------------------------
--2024-08-11 17:48:22.570307 UTC---
| Itration            | 459       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.84e+06 |
| Running Env Steps   | 2295000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 459       |
-----------------------------------
--2024-08-11 17:49:54.217153 UTC---
| Itration            | 460       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -8.47e+06 |
| Running Env Steps   | 2300000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 9.66      |
| Running Update Time | 460       |
-----------------------------------
--2024-08-11 17:51:27.198218 UTC---
| Itration            | 461       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.75e+06 |
| Running Env Steps   | 2305000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.76      |
| Running Update Time | 461       |
-----------------------------------
--2024-08-11 17:52:58.370514 UTC---
| Itration            | 462       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.43e+06 |
| Running Env Steps   | 2310000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 9.86      |
| Running Update Time | 462       |
-----------------------------------
--2024-08-11 17:54:32.489671 UTC---
| Itration            | 463       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.07e+06 |
| Running Env Steps   | 2315000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 463       |
-----------------------------------
--2024-08-11 17:56:05.829909 UTC---
| Itration            | 464       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.32e+06 |
| Running Env Steps   | 2320000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 464       |
-----------------------------------
--2024-08-11 17:57:38.299290 UTC---
| Itration            | 465       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.04e+04  |
| Reward Loss         | -8.38e+06 |
| Running Env Steps   | 2325000   |
| Running Forward KL  | 14.5      |
| Running Reverse KL  | 10        |
| Running Update Time | 465       |
-----------------------------------
--2024-08-11 17:59:11.080726 UTC---
| Itration            | 466       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.12e+06 |
| Running Env Steps   | 2330000   |
| Running Forward KL  | 14.5      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 466       |
-----------------------------------
--2024-08-11 18:00:43.180738 UTC---
| Itration            | 467       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.69e+06 |
| Running Env Steps   | 2335000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 9.78      |
| Running Update Time | 467       |
-----------------------------------
--2024-08-11 18:02:15.686987 UTC---
| Itration            | 468       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -5.75e+06 |
| Running Env Steps   | 2340000   |
| Running Forward KL  | 14.1      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 468       |
-----------------------------------
--2024-08-11 18:03:49.582882 UTC---
| Itration            | 469       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.12e+06 |
| Running Env Steps   | 2345000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 469       |
-----------------------------------
--2024-08-11 18:05:20.114859 UTC---
| Itration            | 470       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -8.59e+06 |
| Running Env Steps   | 2350000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 9.43      |
| Running Update Time | 470       |
-----------------------------------
--2024-08-11 18:06:54.015402 UTC---
| Itration            | 471       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -5.11e+06 |
| Running Env Steps   | 2355000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.92      |
| Running Update Time | 471       |
-----------------------------------
--2024-08-11 18:08:27.316762 UTC---
| Itration            | 472       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.57e+06 |
| Running Env Steps   | 2360000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 472       |
-----------------------------------
--2024-08-11 18:09:58.471498 UTC---
| Itration            | 473       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -7.09e+06 |
| Running Env Steps   | 2365000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 473       |
-----------------------------------
--2024-08-11 18:11:31.137202 UTC---
| Itration            | 474       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.03e+06 |
| Running Env Steps   | 2370000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 474       |
-----------------------------------
--2024-08-11 18:13:04.493302 UTC---
| Itration            | 475       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -1.39e+07 |
| Running Env Steps   | 2375000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 8.66      |
| Running Update Time | 475       |
-----------------------------------
--2024-08-11 18:14:37.693722 UTC---
| Itration            | 476       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -6.18e+06 |
| Running Env Steps   | 2380000   |
| Running Forward KL  | 14.1      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 476       |
-----------------------------------
--2024-08-11 18:16:11.960557 UTC---
| Itration            | 477       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -7.31e+06 |
| Running Env Steps   | 2385000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 477       |
-----------------------------------
--2024-08-11 18:17:42.765472 UTC--
| Itration            | 478      |
| Real Det Return     | 1.22e+04 |
| Real Sto Return     | 1.17e+04 |
| Reward Loss         | -6.6e+06 |
| Running Env Steps   | 2390000  |
| Running Forward KL  | 14.9     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 478      |
----------------------------------
--2024-08-11 18:19:16.473713 UTC---
| Itration            | 479       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -6.42e+06 |
| Running Env Steps   | 2395000   |
| Running Forward KL  | 14.5      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 479       |
-----------------------------------
--2024-08-11 18:20:49.623950 UTC---
| Itration            | 480       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.62e+06 |
| Running Env Steps   | 2400000   |
| Running Forward KL  | 14.8      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 480       |
-----------------------------------
--2024-08-11 18:22:21.145959 UTC---
| Itration            | 481       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.2e+04   |
| Reward Loss         | -4.88e+06 |
| Running Env Steps   | 2405000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 11        |
| Running Update Time | 481       |
-----------------------------------
--2024-08-11 18:23:53.697338 UTC---
| Itration            | 482       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -6.01e+06 |
| Running Env Steps   | 2410000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 482       |
-----------------------------------
--2024-08-11 18:25:25.433831 UTC---
| Itration            | 483       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.76e+06 |
| Running Env Steps   | 2415000   |
| Running Forward KL  | 13.9      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 483       |
-----------------------------------
--2024-08-11 18:26:59.365738 UTC---
| Itration            | 484       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -8.13e+06 |
| Running Env Steps   | 2420000   |
| Running Forward KL  | 14.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 484       |
-----------------------------------
--2024-08-11 18:28:32.843202 UTC---
| Itration            | 485       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.62e+06 |
| Running Env Steps   | 2425000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 485       |
-----------------------------------
--2024-08-11 18:30:04.273047 UTC---
| Itration            | 486       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.49e+06 |
| Running Env Steps   | 2430000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 486       |
-----------------------------------
--2024-08-11 18:31:37.657983 UTC---
| Itration            | 487       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.91e+06 |
| Running Env Steps   | 2435000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 10.3      |
| Running Update Time | 487       |
-----------------------------------
--2024-08-11 18:33:12.107321 UTC---
| Itration            | 488       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 9.38e+03  |
| Reward Loss         | -9.81e+06 |
| Running Env Steps   | 2440000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.7       |
| Running Update Time | 488       |
-----------------------------------
--2024-08-11 18:34:43.813376 UTC---
| Itration            | 489       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.93e+06 |
| Running Env Steps   | 2445000   |
| Running Forward KL  | 14.1      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 489       |
-----------------------------------
--2024-08-11 18:36:16.642794 UTC---
| Itration            | 490       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -4.63e+06 |
| Running Env Steps   | 2450000   |
| Running Forward KL  | 13.9      |
| Running Reverse KL  | 9.99      |
| Running Update Time | 490       |
-----------------------------------
--2024-08-11 18:37:48.167490 UTC---
| Itration            | 491       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.55e+06 |
| Running Env Steps   | 2455000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 491       |
-----------------------------------
--2024-08-11 18:39:20.380270 UTC---
| Itration            | 492       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -4.59e+06 |
| Running Env Steps   | 2460000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 492       |
-----------------------------------
--2024-08-11 18:40:53.793870 UTC---
| Itration            | 493       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.77e+06 |
| Running Env Steps   | 2465000   |
| Running Forward KL  | 13.8      |
| Running Reverse KL  | 9.69      |
| Running Update Time | 493       |
-----------------------------------
--2024-08-11 18:42:25.095391 UTC---
| Itration            | 494       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.58e+06 |
| Running Env Steps   | 2470000   |
| Running Forward KL  | 14.3      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 494       |
-----------------------------------
--2024-08-11 18:43:58.909135 UTC---
| Itration            | 495       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -8.32e+06 |
| Running Env Steps   | 2475000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.31      |
| Running Update Time | 495       |
-----------------------------------
--2024-08-11 18:45:32.274299 UTC---
| Itration            | 496       |
| Real Det Return     | 1.13e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.74e+06 |
| Running Env Steps   | 2480000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 496       |
-----------------------------------
--2024-08-11 18:47:03.944109 UTC---
| Itration            | 497       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.66e+06 |
| Running Env Steps   | 2485000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 10.1      |
| Running Update Time | 497       |
-----------------------------------
--2024-08-11 18:48:36.598265 UTC---
| Itration            | 498       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -7.58e+06 |
| Running Env Steps   | 2490000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 8.73      |
| Running Update Time | 498       |
-----------------------------------
--2024-08-11 18:50:08.920629 UTC--
| Itration            | 499      |
| Real Det Return     | 1.22e+04 |
| Real Sto Return     | 1.16e+04 |
| Reward Loss         | -5.1e+06 |
| Running Env Steps   | 2495000  |
| Running Forward KL  | 13.4     |
| Running Reverse KL  | 9.55     |
| Running Update Time | 499      |
----------------------------------
--2024-08-11 18:51:41.293524 UTC---
| Itration            | 500       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -6.65e+06 |
| Running Env Steps   | 2500000   |
| Running Forward KL  | 13.6      |
| Running Reverse KL  | 9.15      |
| Running Update Time | 500       |
-----------------------------------
--2024-08-11 18:53:15.000670 UTC---
| Itration            | 501       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.14e+06 |
| Running Env Steps   | 2505000   |
| Running Forward KL  | 13.8      |
| Running Reverse KL  | 9.93      |
| Running Update Time | 501       |
-----------------------------------
--2024-08-11 18:54:45.538398 UTC---
| Itration            | 502       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -1.01e+07 |
| Running Env Steps   | 2510000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 9.07      |
| Running Update Time | 502       |
-----------------------------------
--2024-08-11 18:56:19.526199 UTC---
| Itration            | 503       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -7.15e+06 |
| Running Env Steps   | 2515000   |
| Running Forward KL  | 13.4      |
| Running Reverse KL  | 9.12      |
| Running Update Time | 503       |
-----------------------------------
--2024-08-11 18:57:52.495325 UTC---
| Itration            | 504       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.37e+06 |
| Running Env Steps   | 2520000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 9.8       |
| Running Update Time | 504       |
-----------------------------------
--2024-08-11 18:59:24.048229 UTC---
| Itration            | 505       |
| Real Det Return     | 1.16e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.46e+06 |
| Running Env Steps   | 2525000   |
| Running Forward KL  | 13.7      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 505       |
-----------------------------------
--2024-08-11 19:00:57.427956 UTC---
| Itration            | 506       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.47e+06 |
| Running Env Steps   | 2530000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 506       |
-----------------------------------
--2024-08-11 19:02:29.813513 UTC--
| Itration            | 507      |
| Real Det Return     | 1.17e+04 |
| Real Sto Return     | 1.13e+04 |
| Reward Loss         | -6.9e+06 |
| Running Env Steps   | 2535000  |
| Running Forward KL  | 13.4     |
| Running Reverse KL  | 9.52     |
| Running Update Time | 507      |
----------------------------------
--2024-08-11 19:04:01.550116 UTC---
| Itration            | 508       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.39e+06 |
| Running Env Steps   | 2540000   |
| Running Forward KL  | 14.2      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 508       |
-----------------------------------
--2024-08-11 19:05:35.337074 UTC---
| Itration            | 509       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.07e+06 |
| Running Env Steps   | 2545000   |
| Running Forward KL  | 13.9      |
| Running Reverse KL  | 9.76      |
| Running Update Time | 509       |
-----------------------------------
--2024-08-11 19:07:06.477200 UTC---
| Itration            | 510       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.43e+06 |
| Running Env Steps   | 2550000   |
| Running Forward KL  | 13.3      |
| Running Reverse KL  | 9.13      |
| Running Update Time | 510       |
-----------------------------------
--2024-08-11 19:08:40.271230 UTC---
| Itration            | 511       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.91e+06 |
| Running Env Steps   | 2555000   |
| Running Forward KL  | 13.6      |
| Running Reverse KL  | 9.57      |
| Running Update Time | 511       |
-----------------------------------
--2024-08-11 19:10:13.023877 UTC---
| Itration            | 512       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.75e+06 |
| Running Env Steps   | 2560000   |
| Running Forward KL  | 14        |
| Running Reverse KL  | 9.99      |
| Running Update Time | 512       |
-----------------------------------
--2024-08-11 19:11:44.163752 UTC---
| Itration            | 513       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.34e+06 |
| Running Env Steps   | 2565000   |
| Running Forward KL  | 13.8      |
| Running Reverse KL  | 9.81      |
| Running Update Time | 513       |
-----------------------------------
--2024-08-11 19:13:16.503350 UTC---
| Itration            | 514       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -5.03e+06 |
| Running Env Steps   | 2570000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 9.73      |
| Running Update Time | 514       |
-----------------------------------
--2024-08-11 19:14:48.115547 UTC---
| Itration            | 515       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.84e+06 |
| Running Env Steps   | 2575000   |
| Running Forward KL  | 13.3      |
| Running Reverse KL  | 9.6       |
| Running Update Time | 515       |
-----------------------------------
--2024-08-11 19:16:19.813903 UTC---
| Itration            | 516       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -9.87e+06 |
| Running Env Steps   | 2580000   |
| Running Forward KL  | 13.7      |
| Running Reverse KL  | 9.01      |
| Running Update Time | 516       |
-----------------------------------
--2024-08-11 19:17:53.354533 UTC---
| Itration            | 517       |
| Real Det Return     | 1.26e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.61e+06 |
| Running Env Steps   | 2585000   |
| Running Forward KL  | 13.4      |
| Running Reverse KL  | 9.37      |
| Running Update Time | 517       |
-----------------------------------
--2024-08-11 19:19:23.963776 UTC---
| Itration            | 518       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.06e+06 |
| Running Env Steps   | 2590000   |
| Running Forward KL  | 13.7      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 518       |
-----------------------------------
--2024-08-11 19:20:57.185127 UTC---
| Itration            | 519       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.04e+06 |
| Running Env Steps   | 2595000   |
| Running Forward KL  | 13        |
| Running Reverse KL  | 9.02      |
| Running Update Time | 519       |
-----------------------------------
--2024-08-11 19:22:30.104154 UTC---
| Itration            | 520       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -4.99e+06 |
| Running Env Steps   | 2600000   |
| Running Forward KL  | 13.2      |
| Running Reverse KL  | 9.54      |
| Running Update Time | 520       |
-----------------------------------
--2024-08-11 19:24:01.781838 UTC---
| Itration            | 521       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.59e+06 |
| Running Env Steps   | 2605000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 9.2       |
| Running Update Time | 521       |
-----------------------------------
--2024-08-11 19:25:33.448045 UTC---
| Itration            | 522       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.59e+06 |
| Running Env Steps   | 2610000   |
| Running Forward KL  | 13.7      |
| Running Reverse KL  | 9.43      |
| Running Update Time | 522       |
-----------------------------------
--2024-08-11 19:27:05.771394 UTC---
| Itration            | 523       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -7.05e+06 |
| Running Env Steps   | 2615000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 9.74      |
| Running Update Time | 523       |
-----------------------------------
--2024-08-11 19:28:37.803574 UTC---
| Itration            | 524       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.27e+06 |
| Running Env Steps   | 2620000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 9.46      |
| Running Update Time | 524       |
-----------------------------------
--2024-08-11 19:30:10.737465 UTC---
| Itration            | 525       |
| Real Det Return     | 1.26e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -4.45e+06 |
| Running Env Steps   | 2625000   |
| Running Forward KL  | 13.2      |
| Running Reverse KL  | 9.3       |
| Running Update Time | 525       |
-----------------------------------
--2024-08-11 19:31:41.084927 UTC---
| Itration            | 526       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.08e+04  |
| Reward Loss         | -8.32e+06 |
| Running Env Steps   | 2630000   |
| Running Forward KL  | 13        |
| Running Reverse KL  | 8.43      |
| Running Update Time | 526       |
-----------------------------------
--2024-08-11 19:33:15.091564 UTC---
| Itration            | 527       |
| Real Det Return     | 1.15e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -6.65e+06 |
| Running Env Steps   | 2635000   |
| Running Forward KL  | 13.5      |
| Running Reverse KL  | 10        |
| Running Update Time | 527       |
-----------------------------------
--2024-08-11 19:34:48.459448 UTC---
| Itration            | 528       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.53e+06 |
| Running Env Steps   | 2640000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.27      |
| Running Update Time | 528       |
-----------------------------------
--2024-08-11 19:36:20.149384 UTC---
| Itration            | 529       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.26e+06 |
| Running Env Steps   | 2645000   |
| Running Forward KL  | 13.2      |
| Running Reverse KL  | 9.13      |
| Running Update Time | 529       |
-----------------------------------
--2024-08-11 19:37:53.084424 UTC---
| Itration            | 530       |
| Real Det Return     | 1.1e+04   |
| Real Sto Return     | 9.45e+03  |
| Reward Loss         | -9.09e+06 |
| Running Env Steps   | 2650000   |
| Running Forward KL  | 13.6      |
| Running Reverse KL  | 8.19      |
| Running Update Time | 530       |
-----------------------------------
--2024-08-11 19:39:25.855857 UTC---
| Itration            | 531       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.09e+04  |
| Reward Loss         | -6.41e+06 |
| Running Env Steps   | 2655000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 8.87      |
| Running Update Time | 531       |
-----------------------------------
--2024-08-11 19:40:58.123631 UTC---
| Itration            | 532       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.85e+06 |
| Running Env Steps   | 2660000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 8.79      |
| Running Update Time | 532       |
-----------------------------------
--2024-08-11 19:42:32.031784 UTC---
| Itration            | 533       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.16e+06 |
| Running Env Steps   | 2665000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 9.02      |
| Running Update Time | 533       |
-----------------------------------
--2024-08-11 19:44:02.633295 UTC---
| Itration            | 534       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -6.15e+06 |
| Running Env Steps   | 2670000   |
| Running Forward KL  | 13.6      |
| Running Reverse KL  | 9.52      |
| Running Update Time | 534       |
-----------------------------------
--2024-08-11 19:45:36.747397 UTC---
| Itration            | 535       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.97e+06 |
| Running Env Steps   | 2675000   |
| Running Forward KL  | 12.9      |
| Running Reverse KL  | 8.81      |
| Running Update Time | 535       |
-----------------------------------
--2024-08-11 19:47:10.389086 UTC---
| Itration            | 536       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.27e+06 |
| Running Env Steps   | 2680000   |
| Running Forward KL  | 13        |
| Running Reverse KL  | 8.72      |
| Running Update Time | 536       |
-----------------------------------
--2024-08-11 19:48:42.358167 UTC---
| Itration            | 537       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.02e+04  |
| Reward Loss         | -7.93e+06 |
| Running Env Steps   | 2685000   |
| Running Forward KL  | 12.2      |
| Running Reverse KL  | 7.66      |
| Running Update Time | 537       |
-----------------------------------
--2024-08-11 19:50:14.949535 UTC---
| Itration            | 538       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -5.93e+06 |
| Running Env Steps   | 2690000   |
| Running Forward KL  | 12        |
| Running Reverse KL  | 7.7       |
| Running Update Time | 538       |
-----------------------------------
--2024-08-11 19:51:46.954131 UTC---
| Itration            | 539       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -7.74e+06 |
| Running Env Steps   | 2695000   |
| Running Forward KL  | 13.1      |
| Running Reverse KL  | 9.57      |
| Running Update Time | 539       |
-----------------------------------
--2024-08-11 19:53:19.520346 UTC---
| Itration            | 540       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -1.14e+07 |
| Running Env Steps   | 2700000   |
| Running Forward KL  | 12.8      |
| Running Reverse KL  | 8.97      |
| Running Update Time | 540       |
-----------------------------------
--2024-08-11 19:54:53.048520 UTC---
| Itration            | 541       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -7.46e+06 |
| Running Env Steps   | 2705000   |
| Running Forward KL  | 12.9      |
| Running Reverse KL  | 8.8       |
| Running Update Time | 541       |
-----------------------------------
--2024-08-11 19:56:24.933040 UTC---
| Itration            | 542       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.76e+06 |
| Running Env Steps   | 2710000   |
| Running Forward KL  | 12.8      |
| Running Reverse KL  | 8.82      |
| Running Update Time | 542       |
-----------------------------------
--2024-08-11 19:57:58.399236 UTC--
| Itration            | 543      |
| Real Det Return     | 1.23e+04 |
| Real Sto Return     | 1.16e+04 |
| Reward Loss         | -5.6e+06 |
| Running Env Steps   | 2715000  |
| Running Forward KL  | 12.3     |
| Running Reverse KL  | 8.55     |
| Running Update Time | 543      |
----------------------------------
--2024-08-11 19:59:32.297456 UTC---
| Itration            | 544       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.09e+04  |
| Reward Loss         | -6.77e+06 |
| Running Env Steps   | 2720000   |
| Running Forward KL  | 12.8      |
| Running Reverse KL  | 8.71      |
| Running Update Time | 544       |
-----------------------------------
--2024-08-11 20:01:03.852999 UTC---
| Itration            | 545       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.45e+06 |
| Running Env Steps   | 2725000   |
| Running Forward KL  | 12.8      |
| Running Reverse KL  | 9.07      |
| Running Update Time | 545       |
-----------------------------------
--2024-08-11 20:02:36.561838 UTC---
| Itration            | 546       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.99e+06 |
| Running Env Steps   | 2730000   |
| Running Forward KL  | 12.9      |
| Running Reverse KL  | 8.8       |
| Running Update Time | 546       |
-----------------------------------
--2024-08-11 20:04:08.612058 UTC---
| Itration            | 547       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.68e+06 |
| Running Env Steps   | 2735000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 8.84      |
| Running Update Time | 547       |
-----------------------------------
--2024-08-11 20:05:41.997637 UTC--
| Itration            | 548      |
| Real Det Return     | 1.23e+04 |
| Real Sto Return     | 1.17e+04 |
| Reward Loss         | -5.7e+06 |
| Running Env Steps   | 2740000  |
| Running Forward KL  | 12.6     |
| Running Reverse KL  | 9.51     |
| Running Update Time | 548      |
----------------------------------
--2024-08-11 20:07:15.708792 UTC---
| Itration            | 549       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -7.77e+06 |
| Running Env Steps   | 2745000   |
| Running Forward KL  | 12.9      |
| Running Reverse KL  | 7.99      |
| Running Update Time | 549       |
-----------------------------------
--2024-08-11 20:08:47.155279 UTC---
| Itration            | 550       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -5.86e+06 |
| Running Env Steps   | 2750000   |
| Running Forward KL  | 12.6      |
| Running Reverse KL  | 8.31      |
| Running Update Time | 550       |
-----------------------------------
--2024-08-11 20:10:21.467805 UTC---
| Itration            | 551       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -5.63e+06 |
| Running Env Steps   | 2755000   |
| Running Forward KL  | 12.2      |
| Running Reverse KL  | 8.08      |
| Running Update Time | 551       |
-----------------------------------
--2024-08-11 20:11:54.718095 UTC---
| Itration            | 552       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.98e+06 |
| Running Env Steps   | 2760000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 9.26      |
| Running Update Time | 552       |
-----------------------------------
--2024-08-11 20:13:26.098235 UTC--
| Itration            | 553      |
| Real Det Return     | 1.24e+04 |
| Real Sto Return     | 1.16e+04 |
| Reward Loss         | -8.7e+06 |
| Running Env Steps   | 2765000  |
| Running Forward KL  | 12.1     |
| Running Reverse KL  | 9.16     |
| Running Update Time | 553      |
----------------------------------
--2024-08-11 20:14:58.810796 UTC---
| Itration            | 554       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -4.54e+06 |
| Running Env Steps   | 2770000   |
| Running Forward KL  | 12.3      |
| Running Reverse KL  | 8.9       |
| Running Update Time | 554       |
-----------------------------------
--2024-08-11 20:16:30.799836 UTC---
| Itration            | 555       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.63e+06 |
| Running Env Steps   | 2775000   |
| Running Forward KL  | 12.3      |
| Running Reverse KL  | 8.62      |
| Running Update Time | 555       |
-----------------------------------
--2024-08-11 20:18:03.888835 UTC---
| Itration            | 556       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.93e+06 |
| Running Env Steps   | 2780000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.84      |
| Running Update Time | 556       |
-----------------------------------
--2024-08-11 20:19:37.816759 UTC---
| Itration            | 557       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -7.54e+06 |
| Running Env Steps   | 2785000   |
| Running Forward KL  | 12.7      |
| Running Reverse KL  | 8.77      |
| Running Update Time | 557       |
-----------------------------------
--2024-08-11 20:21:09.644355 UTC--
| Itration            | 558      |
| Real Det Return     | 1.23e+04 |
| Real Sto Return     | 1.16e+04 |
| Reward Loss         | -6.4e+06 |
| Running Env Steps   | 2790000  |
| Running Forward KL  | 12.9     |
| Running Reverse KL  | 8.91     |
| Running Update Time | 558      |
----------------------------------
--2024-08-11 20:22:43.753460 UTC---
| Itration            | 559       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.24e+06 |
| Running Env Steps   | 2795000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.58      |
| Running Update Time | 559       |
-----------------------------------
--2024-08-11 20:24:16.911534 UTC---
| Itration            | 560       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.1e+04   |
| Reward Loss         | -7.26e+06 |
| Running Env Steps   | 2800000   |
| Running Forward KL  | 12.6      |
| Running Reverse KL  | 9.03      |
| Running Update Time | 560       |
-----------------------------------
--2024-08-11 20:25:48.313427 UTC--
| Itration            | 561      |
| Real Det Return     | 1.2e+04  |
| Real Sto Return     | 1.09e+04 |
| Reward Loss         | -5.3e+06 |
| Running Env Steps   | 2805000  |
| Running Forward KL  | 12.8     |
| Running Reverse KL  | 9.31     |
| Running Update Time | 561      |
----------------------------------
--2024-08-11 20:27:20.625733 UTC---
| Itration            | 562       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.33e+06 |
| Running Env Steps   | 2810000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.79      |
| Running Update Time | 562       |
-----------------------------------
--2024-08-11 20:28:53.015886 UTC---
| Itration            | 563       |
| Real Det Return     | 1.26e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -4.67e+06 |
| Running Env Steps   | 2815000   |
| Running Forward KL  | 12.4      |
| Running Reverse KL  | 8.5       |
| Running Update Time | 563       |
-----------------------------------
--2024-08-11 20:30:26.033304 UTC---
| Itration            | 564       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.05e+06 |
| Running Env Steps   | 2820000   |
| Running Forward KL  | 11.7      |
| Running Reverse KL  | 8.31      |
| Running Update Time | 564       |
-----------------------------------
--2024-08-11 20:31:59.241143 UTC---
| Itration            | 565       |
| Real Det Return     | 1.18e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -7.05e+06 |
| Running Env Steps   | 2825000   |
| Running Forward KL  | 12.6      |
| Running Reverse KL  | 8.5       |
| Running Update Time | 565       |
-----------------------------------
--2024-08-11 20:33:30.693356 UTC--
| Itration            | 566      |
| Real Det Return     | 1.22e+04 |
| Real Sto Return     | 1.1e+04  |
| Reward Loss         | -8.8e+06 |
| Running Env Steps   | 2830000  |
| Running Forward KL  | 12.2     |
| Running Reverse KL  | 9.93     |
| Running Update Time | 566      |
----------------------------------
--2024-08-11 20:35:04.674794 UTC---
| Itration            | 567       |
| Real Det Return     | 1.14e+04  |
| Real Sto Return     | 1.01e+04  |
| Reward Loss         | -6.14e+06 |
| Running Env Steps   | 2835000   |
| Running Forward KL  | 12.3      |
| Running Reverse KL  | 8.43      |
| Running Update Time | 567       |
-----------------------------------
--2024-08-11 20:36:38.279433 UTC---
| Itration            | 568       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.85e+06 |
| Running Env Steps   | 2840000   |
| Running Forward KL  | 12        |
| Running Reverse KL  | 8.17      |
| Running Update Time | 568       |
-----------------------------------
--2024-08-11 20:38:09.523220 UTC---
| Itration            | 569       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -6.08e+06 |
| Running Env Steps   | 2845000   |
| Running Forward KL  | 12.4      |
| Running Reverse KL  | 9.02      |
| Running Update Time | 569       |
-----------------------------------
--2024-08-11 20:39:42.964012 UTC---
| Itration            | 570       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -6.12e+06 |
| Running Env Steps   | 2850000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.65      |
| Running Update Time | 570       |
-----------------------------------
--2024-08-11 20:41:15.244109 UTC---
| Itration            | 571       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.05e+04  |
| Reward Loss         | -6.08e+06 |
| Running Env Steps   | 2855000   |
| Running Forward KL  | 12.2      |
| Running Reverse KL  | 8.56      |
| Running Update Time | 571       |
-----------------------------------
--2024-08-11 20:42:48.235067 UTC---
| Itration            | 572       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -6.09e+06 |
| Running Env Steps   | 2860000   |
| Running Forward KL  | 12.4      |
| Running Reverse KL  | 8.74      |
| Running Update Time | 572       |
-----------------------------------
--2024-08-11 20:44:22.185042 UTC---
| Itration            | 573       |
| Real Det Return     | 1.23e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -4.81e+06 |
| Running Env Steps   | 2865000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 8.42      |
| Running Update Time | 573       |
-----------------------------------
--2024-08-11 20:45:53.712053 UTC---
| Itration            | 574       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.11e+06 |
| Running Env Steps   | 2870000   |
| Running Forward KL  | 12.4      |
| Running Reverse KL  | 8.93      |
| Running Update Time | 574       |
-----------------------------------
--2024-08-11 20:47:27.884387 UTC---
| Itration            | 575       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -4.49e+06 |
| Running Env Steps   | 2875000   |
| Running Forward KL  | 12        |
| Running Reverse KL  | 8.55      |
| Running Update Time | 575       |
-----------------------------------
--2024-08-11 20:49:01.630768 UTC---
| Itration            | 576       |
| Real Det Return     | 1.27e+04  |
| Real Sto Return     | 1.19e+04  |
| Reward Loss         | -4.51e+06 |
| Running Env Steps   | 2880000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 8.3       |
| Running Update Time | 576       |
-----------------------------------
--2024-08-11 20:50:33.256610 UTC---
| Itration            | 577       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -6.43e+06 |
| Running Env Steps   | 2885000   |
| Running Forward KL  | 12.3      |
| Running Reverse KL  | 8.38      |
| Running Update Time | 577       |
-----------------------------------
--2024-08-11 20:52:06.414677 UTC---
| Itration            | 578       |
| Real Det Return     | 1.21e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -6.31e+06 |
| Running Env Steps   | 2890000   |
| Running Forward KL  | 12.2      |
| Running Reverse KL  | 8.08      |
| Running Update Time | 578       |
-----------------------------------
--2024-08-11 20:53:38.604923 UTC--
| Itration            | 579      |
| Real Det Return     | 1.22e+04 |
| Real Sto Return     | 1.13e+04 |
| Reward Loss         | -5.6e+06 |
| Running Env Steps   | 2895000  |
| Running Forward KL  | 11.8     |
| Running Reverse KL  | 7.78     |
| Running Update Time | 579      |
----------------------------------
--2024-08-11 20:55:11.641207 UTC---
| Itration            | 580       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.08e+04  |
| Reward Loss         | -7.75e+06 |
| Running Env Steps   | 2900000   |
| Running Forward KL  | 11.8      |
| Running Reverse KL  | 7.57      |
| Running Update Time | 580       |
-----------------------------------
--2024-08-11 20:56:45.923652 UTC---
| Itration            | 581       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -4.88e+06 |
| Running Env Steps   | 2905000   |
| Running Forward KL  | 11.1      |
| Running Reverse KL  | 7.4       |
| Running Update Time | 581       |
-----------------------------------
--2024-08-11 20:58:17.108260 UTC--
| Itration            | 582      |
| Real Det Return     | 1.18e+04 |
| Real Sto Return     | 1.17e+04 |
| Reward Loss         | -6.6e+06 |
| Running Env Steps   | 2910000  |
| Running Forward KL  | 12.1     |
| Running Reverse KL  | 8.2      |
| Running Update Time | 582      |
----------------------------------
--2024-08-11 20:59:50.440068 UTC---
| Itration            | 583       |
| Real Det Return     | 1.2e+04   |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.31e+06 |
| Running Env Steps   | 2915000   |
| Running Forward KL  | 11.8      |
| Running Reverse KL  | 7.94      |
| Running Update Time | 583       |
-----------------------------------
--2024-08-11 21:01:23.669110 UTC---
| Itration            | 584       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.13e+04  |
| Reward Loss         | -5.69e+06 |
| Running Env Steps   | 2920000   |
| Running Forward KL  | 12.1      |
| Running Reverse KL  | 8.06      |
| Running Update Time | 584       |
-----------------------------------
--2024-08-11 21:02:55.032933 UTC---
| Itration            | 585       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -9.03e+06 |
| Running Env Steps   | 2925000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 7.43      |
| Running Update Time | 585       |
-----------------------------------
--2024-08-11 21:04:28.590869 UTC--
| Itration            | 586      |
| Real Det Return     | 1.24e+04 |
| Real Sto Return     | 1.11e+04 |
| Reward Loss         | -5.7e+06 |
| Running Env Steps   | 2930000  |
| Running Forward KL  | 11.7     |
| Running Reverse KL  | 8.03     |
| Running Update Time | 586      |
----------------------------------
--2024-08-11 21:06:00.665856 UTC---
| Itration            | 587       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.12e+04  |
| Reward Loss         | -7.87e+06 |
| Running Env Steps   | 2935000   |
| Running Forward KL  | 13.1      |
| Running Reverse KL  | 9.36      |
| Running Update Time | 587       |
-----------------------------------
--2024-08-11 21:07:35.336579 UTC---
| Itration            | 588       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -5.56e+06 |
| Running Env Steps   | 2940000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 8.07      |
| Running Update Time | 588       |
-----------------------------------
--2024-08-11 21:09:08.668517 UTC--
| Itration            | 589      |
| Real Det Return     | 1.23e+04 |
| Real Sto Return     | 1.17e+04 |
| Reward Loss         | -5.4e+06 |
| Running Env Steps   | 2945000  |
| Running Forward KL  | 12.4     |
| Running Reverse KL  | 8.43     |
| Running Update Time | 589      |
----------------------------------
--2024-08-11 21:10:40.523798 UTC---
| Itration            | 590       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.15e+04  |
| Reward Loss         | -5.64e+06 |
| Running Env Steps   | 2950000   |
| Running Forward KL  | 12.1      |
| Running Reverse KL  | 8.13      |
| Running Update Time | 590       |
-----------------------------------
--2024-08-11 21:12:12.481053 UTC---
| Itration            | 591       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -7.09e+06 |
| Running Env Steps   | 2955000   |
| Running Forward KL  | 12.2      |
| Running Reverse KL  | 7.87      |
| Running Update Time | 591       |
-----------------------------------
--2024-08-11 21:13:44.991113 UTC---
| Itration            | 592       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.17e+04  |
| Reward Loss         | -5.09e+06 |
| Running Env Steps   | 2960000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 8.65      |
| Running Update Time | 592       |
-----------------------------------
--2024-08-11 21:15:16.738999 UTC--
| Itration            | 593      |
| Real Det Return     | 1.16e+04 |
| Real Sto Return     | 1.11e+04 |
| Reward Loss         | -8.1e+06 |
| Running Env Steps   | 2965000  |
| Running Forward KL  | 13.1     |
| Running Reverse KL  | 9.59     |
| Running Update Time | 593      |
----------------------------------
--2024-08-11 21:16:50.009187 UTC---
| Itration            | 594       |
| Real Det Return     | 1.06e+04  |
| Real Sto Return     | 1.06e+04  |
| Reward Loss         | -7.72e+06 |
| Running Env Steps   | 2970000   |
| Running Forward KL  | 13.1      |
| Running Reverse KL  | 8.99      |
| Running Update Time | 594       |
-----------------------------------
--2024-08-11 21:18:21.932553 UTC---
| Itration            | 595       |
| Real Det Return     | 1.22e+04  |
| Real Sto Return     | 1.14e+04  |
| Reward Loss         | -7.29e+06 |
| Running Env Steps   | 2975000   |
| Running Forward KL  | 11.3      |
| Running Reverse KL  | 6.96      |
| Running Update Time | 595       |
-----------------------------------
--2024-08-11 21:19:56.413513 UTC---
| Itration            | 596       |
| Real Det Return     | 1.19e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -8.55e+06 |
| Running Env Steps   | 2980000   |
| Running Forward KL  | 12.5      |
| Running Reverse KL  | 8.5       |
| Running Update Time | 596       |
-----------------------------------
--2024-08-11 21:21:29.426510 UTC---
| Itration            | 597       |
| Real Det Return     | 1.24e+04  |
| Real Sto Return     | 1.11e+04  |
| Reward Loss         | -6.18e+06 |
| Running Env Steps   | 2985000   |
| Running Forward KL  | 12.4      |
| Running Reverse KL  | 8.42      |
| Running Update Time | 597       |
-----------------------------------
--2024-08-11 21:23:01.418637 UTC---
| Itration            | 598       |
| Real Det Return     | 1.26e+04  |
| Real Sto Return     | 1.16e+04  |
| Reward Loss         | -5.62e+06 |
| Running Env Steps   | 2990000   |
| Running Forward KL  | 11.2      |
| Running Reverse KL  | 7.79      |
| Running Update Time | 598       |
-----------------------------------
--2024-08-11 21:24:34.263325 UTC---
| Itration            | 599       |
| Real Det Return     | 1.25e+04  |
| Real Sto Return     | 1.18e+04  |
| Reward Loss         | -6.13e+06 |
| Running Env Steps   | 2995000   |
| Running Forward KL  | 11.9      |
| Running Reverse KL  | 8.18      |
| Running Update Time | 599       |
-----------------------------------
