Logging to logs/HalfCheetah-v3/exp-1/maxentirl_sa/2023_11_06_11_03_28
--2023-11-06 11:04:47.353178 CST--
| Itration            | 0        |
| Real Det Return     | 932      |
| Real Sto Return     | 689      |
| Reward Loss         | 96.1     |
| Running Env Steps   | 0        |
| Running Forward KL  | 43.3     |
| Running Reverse KL  | 11.1     |
| Running Update Time | 0        |
----------------------------------
--2023-11-06 11:06:16.284967 CST--
| Itration            | 1        |
| Real Det Return     | 1.02e+03 |
| Real Sto Return     | 688      |
| Reward Loss         | 125      |
| Running Env Steps   | 5000     |
| Running Forward KL  | 43.2     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 1        |
----------------------------------
--2023-11-06 11:07:45.435807 CST--
| Itration            | 2        |
| Real Det Return     | 649      |
| Real Sto Return     | 624      |
| Reward Loss         | 149      |
| Running Env Steps   | 10000    |
| Running Forward KL  | 44.1     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 2        |
----------------------------------
--2023-11-06 11:09:14.577248 CST--
| Itration            | 3        |
| Real Det Return     | 1.07e+03 |
| Real Sto Return     | 652      |
| Reward Loss         | 89.2     |
| Running Env Steps   | 15000    |
| Running Forward KL  | 43.5     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 3        |
----------------------------------
--2023-11-06 11:10:44.040927 CST--
| Itration            | 4        |
| Real Det Return     | 1.11e+03 |
| Real Sto Return     | 721      |
| Reward Loss         | 81.9     |
| Running Env Steps   | 20000    |
| Running Forward KL  | 42.5     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 4        |
----------------------------------
--2023-11-06 11:12:13.531362 CST--
| Itration            | 5        |
| Real Det Return     | 1.01e+03 |
| Real Sto Return     | 746      |
| Reward Loss         | 93.9     |
| Running Env Steps   | 25000    |
| Running Forward KL  | 42.3     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 5        |
----------------------------------
--2023-11-06 11:13:43.066790 CST--
| Itration            | 6        |
| Real Det Return     | 1.15e+03 |
| Real Sto Return     | 734      |
| Reward Loss         | 62.5     |
| Running Env Steps   | 30000    |
| Running Forward KL  | 43.1     |
| Running Reverse KL  | 10.9     |
| Running Update Time | 6        |
----------------------------------
--2023-11-06 11:15:17.732942 CST--
| Itration            | 7        |
| Real Det Return     | 1.29e+03 |
| Real Sto Return     | 715      |
| Reward Loss         | 54.6     |
| Running Env Steps   | 35000    |
| Running Forward KL  | 42.8     |
| Running Reverse KL  | 11.1     |
| Running Update Time | 7        |
----------------------------------
--2023-11-06 11:16:52.066618 CST--
| Itration            | 8        |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 714      |
| Reward Loss         | 43.8     |
| Running Env Steps   | 40000    |
| Running Forward KL  | 43.3     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 8        |
----------------------------------
--2023-11-06 11:18:27.023467 CST--
| Itration            | 9        |
| Real Det Return     | 1.29e+03 |
| Real Sto Return     | 724      |
| Reward Loss         | 9.07     |
| Running Env Steps   | 45000    |
| Running Forward KL  | 43.2     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 9        |
----------------------------------
--2023-11-06 11:20:03.396316 CST--
| Itration            | 10       |
| Real Det Return     | 1.29e+03 |
| Real Sto Return     | 746      |
| Reward Loss         | 7.63     |
| Running Env Steps   | 50000    |
| Running Forward KL  | 42.5     |
| Running Reverse KL  | 10.8     |
| Running Update Time | 10       |
----------------------------------
--2023-11-06 11:21:42.866605 CST--
| Itration            | 11       |
| Real Det Return     | 1.32e+03 |
| Real Sto Return     | 765      |
| Reward Loss         | -2.32    |
| Running Env Steps   | 55000    |
| Running Forward KL  | 42.1     |
| Running Reverse KL  | 10.7     |
| Running Update Time | 11       |
----------------------------------
--2023-11-06 11:23:23.517108 CST--
| Itration            | 12       |
| Real Det Return     | 1.34e+03 |
| Real Sto Return     | 734      |
| Reward Loss         | -28.1    |
| Running Env Steps   | 60000    |
| Running Forward KL  | 43.4     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 12       |
----------------------------------
--2023-11-06 11:25:05.676523 CST--
| Itration            | 13       |
| Real Det Return     | 1.3e+03  |
| Real Sto Return     | 746      |
| Reward Loss         | -39.9    |
| Running Env Steps   | 65000    |
| Running Forward KL  | 42.2     |
| Running Reverse KL  | 10.4     |
| Running Update Time | 13       |
----------------------------------
--2023-11-06 11:26:43.827172 CST--
| Itration            | 14       |
| Real Det Return     | 1.19e+03 |
| Real Sto Return     | 761      |
| Reward Loss         | -52.8    |
| Running Env Steps   | 70000    |
| Running Forward KL  | 43.2     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 14       |
----------------------------------
--2023-11-06 11:28:27.114751 CST--
| Itration            | 15       |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 785      |
| Reward Loss         | -60.7    |
| Running Env Steps   | 75000    |
| Running Forward KL  | 42       |
| Running Reverse KL  | 10.4     |
| Running Update Time | 15       |
----------------------------------
--2023-11-06 11:30:12.838493 CST--
| Itration            | 16       |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 772      |
| Reward Loss         | -65.7    |
| Running Env Steps   | 80000    |
| Running Forward KL  | 41.7     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 16       |
----------------------------------
--2023-11-06 11:32:00.058108 CST--
| Itration            | 17       |
| Real Det Return     | 1.27e+03 |
| Real Sto Return     | 773      |
| Reward Loss         | -78.3    |
| Running Env Steps   | 85000    |
| Running Forward KL  | 42       |
| Running Reverse KL  | 10.2     |
| Running Update Time | 17       |
----------------------------------
--2023-11-06 11:33:48.407013 CST--
| Itration            | 18       |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 791      |
| Reward Loss         | -88.5    |
| Running Env Steps   | 90000    |
| Running Forward KL  | 42.8     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 18       |
----------------------------------
--2023-11-06 11:35:38.018774 CST--
| Itration            | 19       |
| Real Det Return     | 1.2e+03  |
| Real Sto Return     | 790      |
| Reward Loss         | -96.2    |
| Running Env Steps   | 95000    |
| Running Forward KL  | 41.8     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 19       |
----------------------------------
--2023-11-06 11:37:29.401893 CST--
| Itration            | 20       |
| Real Det Return     | 1.15e+03 |
| Real Sto Return     | 762      |
| Reward Loss         | -109     |
| Running Env Steps   | 100000   |
| Running Forward KL  | 42.3     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 20       |
----------------------------------
--2023-11-06 11:39:21.871294 CST--
| Itration            | 21       |
| Real Det Return     | 1.2e+03  |
| Real Sto Return     | 812      |
| Reward Loss         | -116     |
| Running Env Steps   | 105000   |
| Running Forward KL  | 41.2     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 21       |
----------------------------------
--2023-11-06 11:41:15.401262 CST--
| Itration            | 22       |
| Real Det Return     | 1.13e+03 |
| Real Sto Return     | 849      |
| Reward Loss         | -121     |
| Running Env Steps   | 110000   |
| Running Forward KL  | 41.9     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 22       |
----------------------------------
--2023-11-06 11:43:13.683140 CST--
| Itration            | 23       |
| Real Det Return     | 1.05e+03 |
| Real Sto Return     | 833      |
| Reward Loss         | -130     |
| Running Env Steps   | 115000   |
| Running Forward KL  | 41.5     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 23       |
----------------------------------
--2023-11-06 11:45:13.048988 CST--
| Itration            | 24       |
| Real Det Return     | 1.07e+03 |
| Real Sto Return     | 795      |
| Reward Loss         | -140     |
| Running Env Steps   | 120000   |
| Running Forward KL  | 41.9     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 24       |
----------------------------------
--2023-11-06 11:47:13.180850 CST--
| Itration            | 25       |
| Real Det Return     | 918      |
| Real Sto Return     | 739      |
| Reward Loss         | -148     |
| Running Env Steps   | 125000   |
| Running Forward KL  | 41.8     |
| Running Reverse KL  | 10       |
| Running Update Time | 25       |
----------------------------------
--2023-11-06 11:49:14.213878 CST--
| Itration            | 26       |
| Real Det Return     | 1.05e+03 |
| Real Sto Return     | 829      |
| Reward Loss         | -160     |
| Running Env Steps   | 130000   |
| Running Forward KL  | 41.8     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 26       |
----------------------------------
--2023-11-06 11:51:15.690516 CST--
| Itration            | 27       |
| Real Det Return     | 1.11e+03 |
| Real Sto Return     | 845      |
| Reward Loss         | -161     |
| Running Env Steps   | 135000   |
| Running Forward KL  | 41.9     |
| Running Reverse KL  | 10       |
| Running Update Time | 27       |
----------------------------------
--2023-11-06 11:53:15.757760 CST--
| Itration            | 28       |
| Real Det Return     | 807      |
| Real Sto Return     | 815      |
| Reward Loss         | -172     |
| Running Env Steps   | 140000   |
| Running Forward KL  | 40.9     |
| Running Reverse KL  | 9.99     |
| Running Update Time | 28       |
----------------------------------
--2023-11-06 11:55:16.181385 CST--
| Itration            | 29       |
| Real Det Return     | 1.03e+03 |
| Real Sto Return     | 804      |
| Reward Loss         | -175     |
| Running Env Steps   | 145000   |
| Running Forward KL  | 42       |
| Running Reverse KL  | 9.83     |
| Running Update Time | 29       |
----------------------------------
--2023-11-06 11:57:16.327533 CST--
| Itration            | 30       |
| Real Det Return     | 871      |
| Real Sto Return     | 804      |
| Reward Loss         | -190     |
| Running Env Steps   | 150000   |
| Running Forward KL  | 41.5     |
| Running Reverse KL  | 10.1     |
| Running Update Time | 30       |
----------------------------------
--2023-11-06 11:59:16.690307 CST--
| Itration            | 31       |
| Real Det Return     | 972      |
| Real Sto Return     | 778      |
| Reward Loss         | -191     |
| Running Env Steps   | 155000   |
| Running Forward KL  | 41.1     |
| Running Reverse KL  | 10       |
| Running Update Time | 31       |
----------------------------------
--2023-11-06 12:01:14.626596 CST--
| Itration            | 32       |
| Real Det Return     | 1e+03    |
| Real Sto Return     | 846      |
| Reward Loss         | -197     |
| Running Env Steps   | 160000   |
| Running Forward KL  | 41.3     |
| Running Reverse KL  | 10       |
| Running Update Time | 32       |
----------------------------------
--2023-11-06 12:03:15.188379 CST--
| Itration            | 33       |
| Real Det Return     | 1.09e+03 |
| Real Sto Return     | 861      |
| Reward Loss         | -210     |
| Running Env Steps   | 165000   |
| Running Forward KL  | 41.6     |
| Running Reverse KL  | 10.2     |
| Running Update Time | 33       |
----------------------------------
--2023-11-06 12:05:16.296175 CST--
| Itration            | 34       |
| Real Det Return     | 1e+03    |
| Real Sto Return     | 819      |
| Reward Loss         | -217     |
| Running Env Steps   | 170000   |
| Running Forward KL  | 41.6     |
| Running Reverse KL  | 10       |
| Running Update Time | 34       |
----------------------------------
--2023-11-06 12:07:26.108482 CST--
| Itration            | 35       |
| Real Det Return     | 850      |
| Real Sto Return     | 813      |
| Reward Loss         | -222     |
| Running Env Steps   | 175000   |
| Running Forward KL  | 41.2     |
| Running Reverse KL  | 10       |
| Running Update Time | 35       |
----------------------------------
--2023-11-06 12:09:35.855731 CST--
| Itration            | 36       |
| Real Det Return     | 634      |
| Real Sto Return     | 821      |
| Reward Loss         | -230     |
| Running Env Steps   | 180000   |
| Running Forward KL  | 40.9     |
| Running Reverse KL  | 9.87     |
| Running Update Time | 36       |
----------------------------------
--2023-11-06 12:11:45.190360 CST--
| Itration            | 37       |
| Real Det Return     | 991      |
| Real Sto Return     | 825      |
| Reward Loss         | -223     |
| Running Env Steps   | 185000   |
| Running Forward KL  | 40.7     |
| Running Reverse KL  | 9.88     |
| Running Update Time | 37       |
----------------------------------
--2023-11-06 12:13:54.734117 CST--
| Itration            | 38       |
| Real Det Return     | 873      |
| Real Sto Return     | 836      |
| Reward Loss         | -232     |
| Running Env Steps   | 190000   |
| Running Forward KL  | 41       |
| Running Reverse KL  | 9.9      |
| Running Update Time | 38       |
----------------------------------
--2023-11-06 12:16:04.234650 CST--
| Itration            | 39       |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 839      |
| Reward Loss         | -242     |
| Running Env Steps   | 195000   |
| Running Forward KL  | 41.1     |
| Running Reverse KL  | 9.66     |
| Running Update Time | 39       |
----------------------------------
--2023-11-06 12:18:13.795555 CST--
| Itration            | 40       |
| Real Det Return     | 758      |
| Real Sto Return     | 830      |
| Reward Loss         | -248     |
| Running Env Steps   | 200000   |
| Running Forward KL  | 40.8     |
| Running Reverse KL  | 9.58     |
| Running Update Time | 40       |
----------------------------------
--2023-11-06 12:20:23.407133 CST--
| Itration            | 41       |
| Real Det Return     | 1.19e+03 |
| Real Sto Return     | 855      |
| Reward Loss         | -261     |
| Running Env Steps   | 205000   |
| Running Forward KL  | 41.4     |
| Running Reverse KL  | 9.69     |
| Running Update Time | 41       |
----------------------------------
--2023-11-06 12:22:33.470510 CST--
| Itration            | 42       |
| Real Det Return     | 756      |
| Real Sto Return     | 866      |
| Reward Loss         | -261     |
| Running Env Steps   | 210000   |
| Running Forward KL  | 40.4     |
| Running Reverse KL  | 9.9      |
| Running Update Time | 42       |
----------------------------------
--2023-11-06 12:24:43.337233 CST--
| Itration            | 43       |
| Real Det Return     | 1.01e+03 |
| Real Sto Return     | 833      |
| Reward Loss         | -277     |
| Running Env Steps   | 215000   |
| Running Forward KL  | 41.7     |
| Running Reverse KL  | 9.7      |
| Running Update Time | 43       |
----------------------------------
--2023-11-06 12:26:53.129963 CST--
| Itration            | 44       |
| Real Det Return     | 1.05e+03 |
| Real Sto Return     | 820      |
| Reward Loss         | -277     |
| Running Env Steps   | 220000   |
| Running Forward KL  | 41.2     |
| Running Reverse KL  | 9.83     |
| Running Update Time | 44       |
----------------------------------
--2023-11-06 12:29:02.917089 CST--
| Itration            | 45       |
| Real Det Return     | 1.02e+03 |
| Real Sto Return     | 822      |
| Reward Loss         | -277     |
| Running Env Steps   | 225000   |
| Running Forward KL  | 41.1     |
| Running Reverse KL  | 9.76     |
| Running Update Time | 45       |
----------------------------------
--2023-11-06 12:31:13.012522 CST--
| Itration            | 46       |
| Real Det Return     | 1.09e+03 |
| Real Sto Return     | 857      |
| Reward Loss         | -292     |
| Running Env Steps   | 230000   |
| Running Forward KL  | 41       |
| Running Reverse KL  | 9.86     |
| Running Update Time | 46       |
----------------------------------
--2023-11-06 12:33:23.087321 CST--
| Itration            | 47       |
| Real Det Return     | 1.14e+03 |
| Real Sto Return     | 839      |
| Reward Loss         | -304     |
| Running Env Steps   | 235000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.6      |
| Running Update Time | 47       |
----------------------------------
--2023-11-06 12:35:33.407347 CST--
| Itration            | 48       |
| Real Det Return     | 1.14e+03 |
| Real Sto Return     | 871      |
| Reward Loss         | -291     |
| Running Env Steps   | 240000   |
| Running Forward KL  | 40.6     |
| Running Reverse KL  | 9.77     |
| Running Update Time | 48       |
----------------------------------
--2023-11-06 12:37:43.784169 CST--
| Itration            | 49       |
| Real Det Return     | 1.16e+03 |
| Real Sto Return     | 825      |
| Reward Loss         | -303     |
| Running Env Steps   | 245000   |
| Running Forward KL  | 40.7     |
| Running Reverse KL  | 9.78     |
| Running Update Time | 49       |
----------------------------------
--2023-11-06 12:39:54.053647 CST--
| Itration            | 50       |
| Real Det Return     | 1.18e+03 |
| Real Sto Return     | 862      |
| Reward Loss         | -313     |
| Running Env Steps   | 250000   |
| Running Forward KL  | 40.7     |
| Running Reverse KL  | 9.69     |
| Running Update Time | 50       |
----------------------------------
--2023-11-06 12:42:04.416588 CST--
| Itration            | 51       |
| Real Det Return     | 1.1e+03  |
| Real Sto Return     | 889      |
| Reward Loss         | -323     |
| Running Env Steps   | 255000   |
| Running Forward KL  | 40.9     |
| Running Reverse KL  | 9.76     |
| Running Update Time | 51       |
----------------------------------
--2023-11-06 12:44:14.871225 CST--
| Itration            | 52       |
| Real Det Return     | 1.18e+03 |
| Real Sto Return     | 898      |
| Reward Loss         | -322     |
| Running Env Steps   | 260000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.7      |
| Running Update Time | 52       |
----------------------------------
--2023-11-06 12:46:24.976593 CST--
| Itration            | 53       |
| Real Det Return     | 1.26e+03 |
| Real Sto Return     | 867      |
| Reward Loss         | -330     |
| Running Env Steps   | 265000   |
| Running Forward KL  | 39.8     |
| Running Reverse KL  | 9.79     |
| Running Update Time | 53       |
----------------------------------
--2023-11-06 12:48:34.954913 CST--
| Itration            | 54       |
| Real Det Return     | 1.32e+03 |
| Real Sto Return     | 877      |
| Reward Loss         | -333     |
| Running Env Steps   | 270000   |
| Running Forward KL  | 40.6     |
| Running Reverse KL  | 9.64     |
| Running Update Time | 54       |
----------------------------------
--2023-11-06 12:50:45.044679 CST--
| Itration            | 55       |
| Real Det Return     | 1.05e+03 |
| Real Sto Return     | 846      |
| Reward Loss         | -344     |
| Running Env Steps   | 275000   |
| Running Forward KL  | 40.6     |
| Running Reverse KL  | 9.73     |
| Running Update Time | 55       |
----------------------------------
--2023-11-06 12:52:51.468183 CST--
| Itration            | 56       |
| Real Det Return     | 1.32e+03 |
| Real Sto Return     | 884      |
| Reward Loss         | -351     |
| Running Env Steps   | 280000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.68     |
| Running Update Time | 56       |
----------------------------------
--2023-11-06 12:54:57.843639 CST--
| Itration            | 57       |
| Real Det Return     | 1.24e+03 |
| Real Sto Return     | 879      |
| Reward Loss         | -356     |
| Running Env Steps   | 285000   |
| Running Forward KL  | 41       |
| Running Reverse KL  | 9.87     |
| Running Update Time | 57       |
----------------------------------
--2023-11-06 12:57:04.319108 CST--
| Itration            | 58       |
| Real Det Return     | 1.25e+03 |
| Real Sto Return     | 964      |
| Reward Loss         | -349     |
| Running Env Steps   | 290000   |
| Running Forward KL  | 40.9     |
| Running Reverse KL  | 9.73     |
| Running Update Time | 58       |
----------------------------------
--2023-11-06 12:59:10.992010 CST--
| Itration            | 59       |
| Real Det Return     | 1.34e+03 |
| Real Sto Return     | 929      |
| Reward Loss         | -372     |
| Running Env Steps   | 295000   |
| Running Forward KL  | 40.6     |
| Running Reverse KL  | 9.73     |
| Running Update Time | 59       |
----------------------------------
--2023-11-06 13:01:17.674653 CST--
| Itration            | 60       |
| Real Det Return     | 1.22e+03 |
| Real Sto Return     | 890      |
| Reward Loss         | -365     |
| Running Env Steps   | 300000   |
| Running Forward KL  | 40.3     |
| Running Reverse KL  | 9.61     |
| Running Update Time | 60       |
----------------------------------
--2023-11-06 13:03:24.463426 CST--
| Itration            | 61       |
| Real Det Return     | 1.25e+03 |
| Real Sto Return     | 902      |
| Reward Loss         | -376     |
| Running Env Steps   | 305000   |
| Running Forward KL  | 40.7     |
| Running Reverse KL  | 9.73     |
| Running Update Time | 61       |
----------------------------------
--2023-11-06 13:05:31.594278 CST--
| Itration            | 62       |
| Real Det Return     | 1.27e+03 |
| Real Sto Return     | 906      |
| Reward Loss         | -378     |
| Running Env Steps   | 310000   |
| Running Forward KL  | 40.9     |
| Running Reverse KL  | 9.72     |
| Running Update Time | 62       |
----------------------------------
--2023-11-06 13:07:38.571398 CST--
| Itration            | 63       |
| Real Det Return     | 1.33e+03 |
| Real Sto Return     | 941      |
| Reward Loss         | -377     |
| Running Env Steps   | 315000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.68     |
| Running Update Time | 63       |
----------------------------------
--2023-11-06 13:09:40.993175 CST--
| Itration            | 64       |
| Real Det Return     | 1.26e+03 |
| Real Sto Return     | 955      |
| Reward Loss         | -387     |
| Running Env Steps   | 320000   |
| Running Forward KL  | 40.6     |
| Running Reverse KL  | 9.58     |
| Running Update Time | 64       |
----------------------------------
--2023-11-06 13:11:43.498750 CST--
| Itration            | 65       |
| Real Det Return     | 1.36e+03 |
| Real Sto Return     | 982      |
| Reward Loss         | -413     |
| Running Env Steps   | 325000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.67     |
| Running Update Time | 65       |
----------------------------------
--2023-11-06 13:13:46.764786 CST--
| Itration            | 66       |
| Real Det Return     | 1.19e+03 |
| Real Sto Return     | 967      |
| Reward Loss         | -395     |
| Running Env Steps   | 330000   |
| Running Forward KL  | 39.9     |
| Running Reverse KL  | 9.41     |
| Running Update Time | 66       |
----------------------------------
--2023-11-06 13:15:50.835707 CST--
| Itration            | 67       |
| Real Det Return     | 1.4e+03  |
| Real Sto Return     | 987      |
| Reward Loss         | -414     |
| Running Env Steps   | 335000   |
| Running Forward KL  | 40.5     |
| Running Reverse KL  | 9.62     |
| Running Update Time | 67       |
----------------------------------
--2023-11-06 13:17:54.477766 CST--
| Itration            | 68       |
| Real Det Return     | 1.48e+03 |
| Real Sto Return     | 1.03e+03 |
| Reward Loss         | -409     |
| Running Env Steps   | 340000   |
| Running Forward KL  | 39.7     |
| Running Reverse KL  | 9.62     |
| Running Update Time | 68       |
----------------------------------
--2023-11-06 13:19:57.820749 CST--
| Itration            | 69       |
| Real Det Return     | 1.66e+03 |
| Real Sto Return     | 1.05e+03 |
| Reward Loss         | -425     |
| Running Env Steps   | 345000   |
| Running Forward KL  | 40.1     |
| Running Reverse KL  | 9.61     |
| Running Update Time | 69       |
----------------------------------
--2023-11-06 13:22:01.425620 CST--
| Itration            | 70       |
| Real Det Return     | 1.44e+03 |
| Real Sto Return     | 1.07e+03 |
| Reward Loss         | -414     |
| Running Env Steps   | 350000   |
| Running Forward KL  | 39.8     |
| Running Reverse KL  | 9.39     |
| Running Update Time | 70       |
----------------------------------
--2023-11-06 13:24:04.750171 CST--
| Itration            | 71       |
| Real Det Return     | 1.36e+03 |
| Real Sto Return     | 1.05e+03 |
| Reward Loss         | -420     |
| Running Env Steps   | 355000   |
| Running Forward KL  | 40       |
| Running Reverse KL  | 9.33     |
| Running Update Time | 71       |
----------------------------------
--2023-11-06 13:26:08.294038 CST--
| Itration            | 72       |
| Real Det Return     | 1.62e+03 |
| Real Sto Return     | 1.03e+03 |
| Reward Loss         | -438     |
| Running Env Steps   | 360000   |
| Running Forward KL  | 40.1     |
| Running Reverse KL  | 9.48     |
| Running Update Time | 72       |
----------------------------------
--2023-11-06 13:28:12.059031 CST--
| Itration            | 73       |
| Real Det Return     | 1.53e+03 |
| Real Sto Return     | 1.06e+03 |
| Reward Loss         | -444     |
| Running Env Steps   | 365000   |
| Running Forward KL  | 40.3     |
| Running Reverse KL  | 9.55     |
| Running Update Time | 73       |
----------------------------------
--2023-11-06 13:30:19.232880 CST--
| Itration            | 74       |
| Real Det Return     | 1.62e+03 |
| Real Sto Return     | 1.07e+03 |
| Reward Loss         | -442     |
| Running Env Steps   | 370000   |
| Running Forward KL  | 39.4     |
| Running Reverse KL  | 9.46     |
| Running Update Time | 74       |
----------------------------------
--2023-11-06 13:32:27.518604 CST--
| Itration            | 75       |
| Real Det Return     | 1.54e+03 |
| Real Sto Return     | 1.09e+03 |
| Reward Loss         | -456     |
| Running Env Steps   | 375000   |
| Running Forward KL  | 40.2     |
| Running Reverse KL  | 9.54     |
| Running Update Time | 75       |
----------------------------------
--2023-11-06 13:34:35.026180 CST--
| Itration            | 76       |
| Real Det Return     | 1.51e+03 |
| Real Sto Return     | 1.1e+03  |
| Reward Loss         | -464     |
| Running Env Steps   | 380000   |
| Running Forward KL  | 39.5     |
| Running Reverse KL  | 9.45     |
| Running Update Time | 76       |
----------------------------------
--2023-11-06 13:36:43.193316 CST--
| Itration            | 77       |
| Real Det Return     | 1.5e+03  |
| Real Sto Return     | 1.11e+03 |
| Reward Loss         | -446     |
| Running Env Steps   | 385000   |
| Running Forward KL  | 39.5     |
| Running Reverse KL  | 9.36     |
| Running Update Time | 77       |
----------------------------------
--2023-11-06 13:38:50.708239 CST--
| Itration            | 78       |
| Real Det Return     | 1.54e+03 |
| Real Sto Return     | 1.12e+03 |
| Reward Loss         | -465     |
| Running Env Steps   | 390000   |
| Running Forward KL  | 40.2     |
| Running Reverse KL  | 9.48     |
| Running Update Time | 78       |
----------------------------------
--2023-11-06 13:40:58.661989 CST--
| Itration            | 79       |
| Real Det Return     | 1.46e+03 |
| Real Sto Return     | 1.12e+03 |
| Reward Loss         | -462     |
| Running Env Steps   | 395000   |
| Running Forward KL  | 39.7     |
| Running Reverse KL  | 9.36     |
| Running Update Time | 79       |
----------------------------------
--2023-11-06 13:43:06.063874 CST--
| Itration            | 80       |
| Real Det Return     | 1.5e+03  |
| Real Sto Return     | 1.13e+03 |
| Reward Loss         | -461     |
| Running Env Steps   | 400000   |
| Running Forward KL  | 39.2     |
| Running Reverse KL  | 9.32     |
| Running Update Time | 80       |
----------------------------------
--2023-11-06 13:45:13.914192 CST--
| Itration            | 81       |
| Real Det Return     | 1.62e+03 |
| Real Sto Return     | 1.12e+03 |
| Reward Loss         | -463     |
| Running Env Steps   | 405000   |
| Running Forward KL  | 39       |
| Running Reverse KL  | 9.33     |
| Running Update Time | 81       |
----------------------------------
--2023-11-06 13:47:21.422231 CST--
| Itration            | 82       |
| Real Det Return     | 2.05e+03 |
| Real Sto Return     | 1.25e+03 |
| Reward Loss         | -465     |
| Running Env Steps   | 410000   |
| Running Forward KL  | 39.7     |
| Running Reverse KL  | 9.41     |
| Running Update Time | 82       |
----------------------------------
--2023-11-06 13:49:26.958413 CST--
| Itration            | 83       |
| Real Det Return     | 1.54e+03 |
| Real Sto Return     | 1.19e+03 |
| Reward Loss         | -476     |
| Running Env Steps   | 415000   |
| Running Forward KL  | 39.4     |
| Running Reverse KL  | 9.15     |
| Running Update Time | 83       |
----------------------------------
--2023-11-06 13:51:32.485248 CST--
| Itration            | 84       |
| Real Det Return     | 1.59e+03 |
| Real Sto Return     | 1.16e+03 |
| Reward Loss         | -487     |
| Running Env Steps   | 420000   |
| Running Forward KL  | 39.6     |
| Running Reverse KL  | 9.46     |
| Running Update Time | 84       |
----------------------------------
--2023-11-06 13:53:39.486538 CST--
| Itration            | 85       |
| Real Det Return     | 1.5e+03  |
| Real Sto Return     | 1.19e+03 |
| Reward Loss         | -486     |
| Running Env Steps   | 425000   |
| Running Forward KL  | 39.6     |
| Running Reverse KL  | 9.35     |
| Running Update Time | 85       |
----------------------------------
--2023-11-06 13:55:45.084153 CST--
| Itration            | 86       |
| Real Det Return     | 1.63e+03 |
| Real Sto Return     | 1.25e+03 |
| Reward Loss         | -478     |
| Running Env Steps   | 430000   |
| Running Forward KL  | 38.6     |
| Running Reverse KL  | 9.28     |
| Running Update Time | 86       |
----------------------------------
--2023-11-06 13:57:50.781824 CST--
| Itration            | 87       |
| Real Det Return     | 1.69e+03 |
| Real Sto Return     | 1.28e+03 |
| Reward Loss         | -492     |
| Running Env Steps   | 435000   |
| Running Forward KL  | 39.2     |
| Running Reverse KL  | 9.22     |
| Running Update Time | 87       |
----------------------------------
--2023-11-06 13:59:56.536233 CST--
| Itration            | 88       |
| Real Det Return     | 1.82e+03 |
| Real Sto Return     | 1.25e+03 |
| Reward Loss         | -492     |
| Running Env Steps   | 440000   |
| Running Forward KL  | 39.4     |
| Running Reverse KL  | 9.31     |
| Running Update Time | 88       |
----------------------------------
--2023-11-06 14:02:00.376226 CST--
| Itration            | 89       |
| Real Det Return     | 1.71e+03 |
| Real Sto Return     | 1.26e+03 |
| Reward Loss         | -492     |
| Running Env Steps   | 445000   |
| Running Forward KL  | 39.1     |
| Running Reverse KL  | 9.19     |
| Running Update Time | 89       |
----------------------------------
--2023-11-06 14:04:04.826574 CST--
| Itration            | 90       |
| Real Det Return     | 1.73e+03 |
| Real Sto Return     | 1.33e+03 |
| Reward Loss         | -517     |
| Running Env Steps   | 450000   |
| Running Forward KL  | 39.5     |
| Running Reverse KL  | 9.42     |
| Running Update Time | 90       |
----------------------------------
--2023-11-06 14:06:09.088478 CST--
| Itration            | 91       |
| Real Det Return     | 1.8e+03  |
| Real Sto Return     | 1.3e+03  |
| Reward Loss         | -520     |
| Running Env Steps   | 455000   |
| Running Forward KL  | 39.6     |
| Running Reverse KL  | 9.27     |
| Running Update Time | 91       |
----------------------------------
--2023-11-06 14:08:12.950094 CST--
| Itration            | 92       |
| Real Det Return     | 1.71e+03 |
| Real Sto Return     | 1.32e+03 |
| Reward Loss         | -515     |
| Running Env Steps   | 460000   |
| Running Forward KL  | 39.3     |
| Running Reverse KL  | 9.36     |
| Running Update Time | 92       |
----------------------------------
--2023-11-06 14:10:16.625873 CST--
| Itration            | 93       |
| Real Det Return     | 1.85e+03 |
| Real Sto Return     | 1.36e+03 |
| Reward Loss         | -508     |
| Running Env Steps   | 465000   |
| Running Forward KL  | 38.3     |
| Running Reverse KL  | 9.19     |
| Running Update Time | 93       |
----------------------------------
--2023-11-06 14:12:20.324870 CST--
| Itration            | 94       |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 1.46e+03 |
| Reward Loss         | -510     |
| Running Env Steps   | 470000   |
| Running Forward KL  | 38.9     |
| Running Reverse KL  | 9.14     |
| Running Update Time | 94       |
----------------------------------
--2023-11-06 14:14:24.037531 CST--
| Itration            | 95       |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 1.43e+03 |
| Reward Loss         | -505     |
| Running Env Steps   | 475000   |
| Running Forward KL  | 38.7     |
| Running Reverse KL  | 9.17     |
| Running Update Time | 95       |
----------------------------------
--2023-11-06 14:16:36.680648 CST--
| Itration            | 96       |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 1.4e+03  |
| Reward Loss         | -515     |
| Running Env Steps   | 480000   |
| Running Forward KL  | 38.7     |
| Running Reverse KL  | 9.03     |
| Running Update Time | 96       |
----------------------------------
--2023-11-06 14:18:49.180191 CST--
| Itration            | 97       |
| Real Det Return     | 1.95e+03 |
| Real Sto Return     | 1.4e+03  |
| Reward Loss         | -542     |
| Running Env Steps   | 485000   |
| Running Forward KL  | 39.6     |
| Running Reverse KL  | 9.21     |
| Running Update Time | 97       |
----------------------------------
--2023-11-06 14:21:01.527002 CST--
| Itration            | 98       |
| Real Det Return     | 1.9e+03  |
| Real Sto Return     | 1.47e+03 |
| Reward Loss         | -522     |
| Running Env Steps   | 490000   |
| Running Forward KL  | 38.8     |
| Running Reverse KL  | 9.14     |
| Running Update Time | 98       |
----------------------------------
--2023-11-06 14:23:13.863174 CST--
| Itration            | 99       |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 1.47e+03 |
| Reward Loss         | -528     |
| Running Env Steps   | 495000   |
| Running Forward KL  | 39       |
| Running Reverse KL  | 9.04     |
| Running Update Time | 99       |
----------------------------------
--2023-11-06 14:25:25.816070 CST--
| Itration            | 100      |
| Real Det Return     | 1.9e+03  |
| Real Sto Return     | 1.42e+03 |
| Reward Loss         | -532     |
| Running Env Steps   | 500000   |
| Running Forward KL  | 38.9     |
| Running Reverse KL  | 9.2      |
| Running Update Time | 100      |
----------------------------------
--2023-11-06 14:27:37.869137 CST--
| Itration            | 101      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 1.46e+03 |
| Reward Loss         | -534     |
| Running Env Steps   | 505000   |
| Running Forward KL  | 38.6     |
| Running Reverse KL  | 9.11     |
| Running Update Time | 101      |
----------------------------------
--2023-11-06 14:29:50.334185 CST--
| Itration            | 102      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 1.54e+03 |
| Reward Loss         | -535     |
| Running Env Steps   | 510000   |
| Running Forward KL  | 38.3     |
| Running Reverse KL  | 9.01     |
| Running Update Time | 102      |
----------------------------------
--2023-11-06 14:32:02.752643 CST--
| Itration            | 103      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 1.57e+03 |
| Reward Loss         | -536     |
| Running Env Steps   | 515000   |
| Running Forward KL  | 38.9     |
| Running Reverse KL  | 8.98     |
| Running Update Time | 103      |
----------------------------------
--2023-11-06 14:34:15.279009 CST--
| Itration            | 104      |
| Real Det Return     | 2.19e+03 |
| Real Sto Return     | 1.59e+03 |
| Reward Loss         | -537     |
| Running Env Steps   | 520000   |
| Running Forward KL  | 38.6     |
| Running Reverse KL  | 8.96     |
| Running Update Time | 104      |
----------------------------------
--2023-11-06 14:36:27.528864 CST--
| Itration            | 105      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 1.56e+03 |
| Reward Loss         | -555     |
| Running Env Steps   | 525000   |
| Running Forward KL  | 39       |
| Running Reverse KL  | 9.04     |
| Running Update Time | 105      |
----------------------------------
--2023-11-06 14:38:40.538615 CST--
| Itration            | 106      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 1.59e+03 |
| Reward Loss         | -542     |
| Running Env Steps   | 530000   |
| Running Forward KL  | 38       |
| Running Reverse KL  | 8.92     |
| Running Update Time | 106      |
----------------------------------
--2023-11-06 14:40:52.693893 CST--
| Itration            | 107      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 1.58e+03 |
| Reward Loss         | -540     |
| Running Env Steps   | 535000   |
| Running Forward KL  | 38.1     |
| Running Reverse KL  | 9.01     |
| Running Update Time | 107      |
----------------------------------
--2023-11-06 14:43:00.704122 CST--
| Itration            | 108      |
| Real Det Return     | 2.4e+03  |
| Real Sto Return     | 1.62e+03 |
| Reward Loss         | -547     |
| Running Env Steps   | 540000   |
| Running Forward KL  | 38.5     |
| Running Reverse KL  | 8.98     |
| Running Update Time | 108      |
----------------------------------
--2023-11-06 14:45:08.735852 CST--
| Itration            | 109      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 1.67e+03 |
| Reward Loss         | -549     |
| Running Env Steps   | 545000   |
| Running Forward KL  | 38.1     |
| Running Reverse KL  | 8.81     |
| Running Update Time | 109      |
----------------------------------
--2023-11-06 14:47:16.487326 CST--
| Itration            | 110      |
| Real Det Return     | 2.4e+03  |
| Real Sto Return     | 1.65e+03 |
| Reward Loss         | -553     |
| Running Env Steps   | 550000   |
| Running Forward KL  | 37.9     |
| Running Reverse KL  | 8.93     |
| Running Update Time | 110      |
----------------------------------
--2023-11-06 14:49:24.545188 CST--
| Itration            | 111      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 1.71e+03 |
| Reward Loss         | -563     |
| Running Env Steps   | 555000   |
| Running Forward KL  | 38.3     |
| Running Reverse KL  | 8.88     |
| Running Update Time | 111      |
----------------------------------
--2023-11-06 14:51:32.300190 CST--
| Itration            | 112      |
| Real Det Return     | 2.62e+03 |
| Real Sto Return     | 1.7e+03  |
| Reward Loss         | -573     |
| Running Env Steps   | 560000   |
| Running Forward KL  | 38.8     |
| Running Reverse KL  | 8.92     |
| Running Update Time | 112      |
----------------------------------
--2023-11-06 14:53:40.184895 CST--
| Itration            | 113      |
| Real Det Return     | 2.37e+03 |
| Real Sto Return     | 1.76e+03 |
| Reward Loss         | -562     |
| Running Env Steps   | 565000   |
| Running Forward KL  | 37.5     |
| Running Reverse KL  | 8.95     |
| Running Update Time | 113      |
----------------------------------
--2023-11-06 14:55:48.061550 CST--
| Itration            | 114      |
| Real Det Return     | 2.39e+03 |
| Real Sto Return     | 1.7e+03  |
| Reward Loss         | -561     |
| Running Env Steps   | 570000   |
| Running Forward KL  | 38       |
| Running Reverse KL  | 8.72     |
| Running Update Time | 114      |
----------------------------------
--2023-11-06 14:57:56.042136 CST--
| Itration            | 115      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 1.74e+03 |
| Reward Loss         | -575     |
| Running Env Steps   | 575000   |
| Running Forward KL  | 37.9     |
| Running Reverse KL  | 8.91     |
| Running Update Time | 115      |
----------------------------------
--2023-11-06 15:00:03.961046 CST--
| Itration            | 116      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 1.65e+03 |
| Reward Loss         | -581     |
| Running Env Steps   | 580000   |
| Running Forward KL  | 38.3     |
| Running Reverse KL  | 8.95     |
| Running Update Time | 116      |
----------------------------------
--2023-11-06 15:02:11.948812 CST--
| Itration            | 117      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 1.75e+03 |
| Reward Loss         | -590     |
| Running Env Steps   | 585000   |
| Running Forward KL  | 37.9     |
| Running Reverse KL  | 8.96     |
| Running Update Time | 117      |
----------------------------------
--2023-11-06 15:04:20.013866 CST--
| Itration            | 118      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 1.7e+03  |
| Reward Loss         | -581     |
| Running Env Steps   | 590000   |
| Running Forward KL  | 38.4     |
| Running Reverse KL  | 8.92     |
| Running Update Time | 118      |
----------------------------------
--2023-11-06 15:06:27.974003 CST--
| Itration            | 119      |
| Real Det Return     | 2.36e+03 |
| Real Sto Return     | 1.81e+03 |
| Reward Loss         | -591     |
| Running Env Steps   | 595000   |
| Running Forward KL  | 38.6     |
| Running Reverse KL  | 8.84     |
| Running Update Time | 119      |
----------------------------------
--2023-11-06 15:08:35.844595 CST--
| Itration            | 120      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 1.74e+03 |
| Reward Loss         | -578     |
| Running Env Steps   | 600000   |
| Running Forward KL  | 38.1     |
| Running Reverse KL  | 8.82     |
| Running Update Time | 120      |
----------------------------------
--2023-11-06 15:10:43.951373 CST--
| Itration            | 121      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 1.81e+03 |
| Reward Loss         | -565     |
| Running Env Steps   | 605000   |
| Running Forward KL  | 37.6     |
| Running Reverse KL  | 8.65     |
| Running Update Time | 121      |
----------------------------------
--2023-11-06 15:12:52.309284 CST--
| Itration            | 122      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 1.71e+03 |
| Reward Loss         | -584     |
| Running Env Steps   | 610000   |
| Running Forward KL  | 37.5     |
| Running Reverse KL  | 8.78     |
| Running Update Time | 122      |
----------------------------------
--2023-11-06 15:15:00.572748 CST--
| Itration            | 123      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 1.8e+03  |
| Reward Loss         | -580     |
| Running Env Steps   | 615000   |
| Running Forward KL  | 36.9     |
| Running Reverse KL  | 8.66     |
| Running Update Time | 123      |
----------------------------------
--2023-11-06 15:17:08.553128 CST--
| Itration            | 124      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 1.76e+03 |
| Reward Loss         | -600     |
| Running Env Steps   | 620000   |
| Running Forward KL  | 37.3     |
| Running Reverse KL  | 8.79     |
| Running Update Time | 124      |
----------------------------------
--2023-11-06 15:19:16.453613 CST--
| Itration            | 125      |
| Real Det Return     | 2.64e+03 |
| Real Sto Return     | 1.86e+03 |
| Reward Loss         | -594     |
| Running Env Steps   | 625000   |
| Running Forward KL  | 37.4     |
| Running Reverse KL  | 8.7      |
| Running Update Time | 125      |
----------------------------------
--2023-11-06 15:21:24.505353 CST--
| Itration            | 126      |
| Real Det Return     | 2.49e+03 |
| Real Sto Return     | 1.86e+03 |
| Reward Loss         | -599     |
| Running Env Steps   | 630000   |
| Running Forward KL  | 38.1     |
| Running Reverse KL  | 8.84     |
| Running Update Time | 126      |
----------------------------------
--2023-11-06 15:23:32.601005 CST--
| Itration            | 127      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 1.84e+03 |
| Reward Loss         | -599     |
| Running Env Steps   | 635000   |
| Running Forward KL  | 37.2     |
| Running Reverse KL  | 8.72     |
| Running Update Time | 127      |
----------------------------------
--2023-11-06 15:25:40.666541 CST--
| Itration            | 128      |
| Real Det Return     | 2.57e+03 |
| Real Sto Return     | 1.92e+03 |
| Reward Loss         | -582     |
| Running Env Steps   | 640000   |
| Running Forward KL  | 37.5     |
| Running Reverse KL  | 8.61     |
| Running Update Time | 128      |
----------------------------------
--2023-11-06 15:27:48.741484 CST--
| Itration            | 129      |
| Real Det Return     | 2.61e+03 |
| Real Sto Return     | 1.96e+03 |
| Reward Loss         | -584     |
| Running Env Steps   | 645000   |
| Running Forward KL  | 37.6     |
| Running Reverse KL  | 8.57     |
| Running Update Time | 129      |
----------------------------------
--2023-11-06 15:29:56.893064 CST--
| Itration            | 130      |
| Real Det Return     | 2.25e+03 |
| Real Sto Return     | 1.87e+03 |
| Reward Loss         | -611     |
| Running Env Steps   | 650000   |
| Running Forward KL  | 37.1     |
| Running Reverse KL  | 8.75     |
| Running Update Time | 130      |
----------------------------------
--2023-11-06 15:32:04.798132 CST--
| Itration            | 131      |
| Real Det Return     | 2.47e+03 |
| Real Sto Return     | 1.88e+03 |
| Reward Loss         | -618     |
| Running Env Steps   | 655000   |
| Running Forward KL  | 38       |
| Running Reverse KL  | 8.72     |
| Running Update Time | 131      |
----------------------------------
--2023-11-06 15:34:12.699177 CST--
| Itration            | 132      |
| Real Det Return     | 2.63e+03 |
| Real Sto Return     | 1.92e+03 |
| Reward Loss         | -603     |
| Running Env Steps   | 660000   |
| Running Forward KL  | 37.8     |
| Running Reverse KL  | 8.7      |
| Running Update Time | 132      |
----------------------------------
--2023-11-06 15:36:20.554604 CST--
| Itration            | 133      |
| Real Det Return     | 2.51e+03 |
| Real Sto Return     | 1.96e+03 |
| Reward Loss         | -612     |
| Running Env Steps   | 665000   |
| Running Forward KL  | 37.3     |
| Running Reverse KL  | 8.69     |
| Running Update Time | 133      |
----------------------------------
--2023-11-06 15:38:28.429575 CST--
| Itration            | 134      |
| Real Det Return     | 2.7e+03  |
| Real Sto Return     | 2e+03    |
| Reward Loss         | -617     |
| Running Env Steps   | 670000   |
| Running Forward KL  | 37.7     |
| Running Reverse KL  | 8.59     |
| Running Update Time | 134      |
----------------------------------
--2023-11-06 15:40:36.311063 CST--
| Itration            | 135      |
| Real Det Return     | 2.54e+03 |
| Real Sto Return     | 1.97e+03 |
| Reward Loss         | -602     |
| Running Env Steps   | 675000   |
| Running Forward KL  | 37       |
| Running Reverse KL  | 8.51     |
| Running Update Time | 135      |
----------------------------------
--2023-11-06 15:42:44.293033 CST--
| Itration            | 136      |
| Real Det Return     | 2.56e+03 |
| Real Sto Return     | 1.99e+03 |
| Reward Loss         | -616     |
| Running Env Steps   | 680000   |
| Running Forward KL  | 36.7     |
| Running Reverse KL  | 8.56     |
| Running Update Time | 136      |
----------------------------------
--2023-11-06 15:44:52.149754 CST--
| Itration            | 137      |
| Real Det Return     | 2.76e+03 |
| Real Sto Return     | 2.12e+03 |
| Reward Loss         | -594     |
| Running Env Steps   | 685000   |
| Running Forward KL  | 36.7     |
| Running Reverse KL  | 8.53     |
| Running Update Time | 137      |
----------------------------------
--2023-11-06 15:47:00.314866 CST--
| Itration            | 138      |
| Real Det Return     | 2.76e+03 |
| Real Sto Return     | 1.95e+03 |
| Reward Loss         | -646     |
| Running Env Steps   | 690000   |
| Running Forward KL  | 37.2     |
| Running Reverse KL  | 8.78     |
| Running Update Time | 138      |
----------------------------------
--2023-11-06 15:49:08.572702 CST--
| Itration            | 139      |
| Real Det Return     | 2.64e+03 |
| Real Sto Return     | 2.06e+03 |
| Reward Loss         | -618     |
| Running Env Steps   | 695000   |
| Running Forward KL  | 37       |
| Running Reverse KL  | 8.47     |
| Running Update Time | 139      |
----------------------------------
--2023-11-06 15:51:17.247700 CST--
| Itration            | 140      |
| Real Det Return     | 2.71e+03 |
| Real Sto Return     | 2.09e+03 |
| Reward Loss         | -612     |
| Running Env Steps   | 700000   |
| Running Forward KL  | 36.9     |
| Running Reverse KL  | 8.42     |
| Running Update Time | 140      |
----------------------------------
--2023-11-06 15:53:25.679561 CST--
| Itration            | 141      |
| Real Det Return     | 2.58e+03 |
| Real Sto Return     | 2.12e+03 |
| Reward Loss         | -608     |
| Running Env Steps   | 705000   |
| Running Forward KL  | 36.9     |
| Running Reverse KL  | 8.42     |
| Running Update Time | 141      |
----------------------------------
--2023-11-06 15:55:34.047245 CST--
| Itration            | 142      |
| Real Det Return     | 2.69e+03 |
| Real Sto Return     | 2.15e+03 |
| Reward Loss         | -606     |
| Running Env Steps   | 710000   |
| Running Forward KL  | 36.7     |
| Running Reverse KL  | 8.32     |
| Running Update Time | 142      |
----------------------------------
--2023-11-06 15:57:42.210206 CST--
| Itration            | 143      |
| Real Det Return     | 2.68e+03 |
| Real Sto Return     | 2.07e+03 |
| Reward Loss         | -630     |
| Running Env Steps   | 715000   |
| Running Forward KL  | 36       |
| Running Reverse KL  | 8.39     |
| Running Update Time | 143      |
----------------------------------
--2023-11-06 15:59:50.839602 CST--
| Itration            | 144      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.15e+03 |
| Reward Loss         | -604     |
| Running Env Steps   | 720000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 8.29     |
| Running Update Time | 144      |
----------------------------------
--2023-11-06 16:01:59.185826 CST--
| Itration            | 145      |
| Real Det Return     | 2.74e+03 |
| Real Sto Return     | 2.1e+03  |
| Reward Loss         | -633     |
| Running Env Steps   | 725000   |
| Running Forward KL  | 36.6     |
| Running Reverse KL  | 8.44     |
| Running Update Time | 145      |
----------------------------------
--2023-11-06 16:04:07.887592 CST--
| Itration            | 146      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.21e+03 |
| Reward Loss         | -613     |
| Running Env Steps   | 730000   |
| Running Forward KL  | 36.4     |
| Running Reverse KL  | 8.44     |
| Running Update Time | 146      |
----------------------------------
--2023-11-06 16:06:16.437282 CST--
| Itration            | 147      |
| Real Det Return     | 2.72e+03 |
| Real Sto Return     | 2.16e+03 |
| Reward Loss         | -625     |
| Running Env Steps   | 735000   |
| Running Forward KL  | 36.5     |
| Running Reverse KL  | 8.33     |
| Running Update Time | 147      |
----------------------------------
--2023-11-06 16:08:25.050074 CST--
| Itration            | 148      |
| Real Det Return     | 2.81e+03 |
| Real Sto Return     | 2.15e+03 |
| Reward Loss         | -617     |
| Running Env Steps   | 740000   |
| Running Forward KL  | 35.9     |
| Running Reverse KL  | 8.33     |
| Running Update Time | 148      |
----------------------------------
--2023-11-06 16:10:33.957163 CST--
| Itration            | 149      |
| Real Det Return     | 2.39e+03 |
| Real Sto Return     | 2.22e+03 |
| Reward Loss         | -638     |
| Running Env Steps   | 745000   |
| Running Forward KL  | 36.1     |
| Running Reverse KL  | 8.35     |
| Running Update Time | 149      |
----------------------------------
--2023-11-06 16:12:42.911667 CST--
| Itration            | 150      |
| Real Det Return     | 2.67e+03 |
| Real Sto Return     | 2.22e+03 |
| Reward Loss         | -617     |
| Running Env Steps   | 750000   |
| Running Forward KL  | 36.8     |
| Running Reverse KL  | 8.32     |
| Running Update Time | 150      |
----------------------------------
--2023-11-06 16:14:52.201378 CST--
| Itration            | 151      |
| Real Det Return     | 2.53e+03 |
| Real Sto Return     | 2.27e+03 |
| Reward Loss         | -621     |
| Running Env Steps   | 755000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 8.25     |
| Running Update Time | 151      |
----------------------------------
--2023-11-06 16:17:01.345524 CST--
| Itration            | 152      |
| Real Det Return     | 2.74e+03 |
| Real Sto Return     | 2.21e+03 |
| Reward Loss         | -625     |
| Running Env Steps   | 760000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 8.27     |
| Running Update Time | 152      |
----------------------------------
--2023-11-06 16:19:10.605240 CST--
| Itration            | 153      |
| Real Det Return     | 2.71e+03 |
| Real Sto Return     | 2.19e+03 |
| Reward Loss         | -650     |
| Running Env Steps   | 765000   |
| Running Forward KL  | 36.8     |
| Running Reverse KL  | 8.34     |
| Running Update Time | 153      |
----------------------------------
--2023-11-06 16:21:19.409273 CST--
| Itration            | 154      |
| Real Det Return     | 2.56e+03 |
| Real Sto Return     | 2.24e+03 |
| Reward Loss         | -630     |
| Running Env Steps   | 770000   |
| Running Forward KL  | 36.6     |
| Running Reverse KL  | 8.28     |
| Running Update Time | 154      |
----------------------------------
--2023-11-06 16:23:31.396972 CST--
| Itration            | 155      |
| Real Det Return     | 2.46e+03 |
| Real Sto Return     | 2.34e+03 |
| Reward Loss         | -630     |
| Running Env Steps   | 775000   |
| Running Forward KL  | 36.6     |
| Running Reverse KL  | 8.28     |
| Running Update Time | 155      |
----------------------------------
--2023-11-06 16:25:43.068480 CST--
| Itration            | 156      |
| Real Det Return     | 2.76e+03 |
| Real Sto Return     | 2.22e+03 |
| Reward Loss         | -642     |
| Running Env Steps   | 780000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 8.34     |
| Running Update Time | 156      |
----------------------------------
--2023-11-06 16:27:54.671062 CST--
| Itration            | 157      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.25e+03 |
| Reward Loss         | -640     |
| Running Env Steps   | 785000   |
| Running Forward KL  | 36.5     |
| Running Reverse KL  | 8.21     |
| Running Update Time | 157      |
----------------------------------
--2023-11-06 16:30:06.417851 CST--
| Itration            | 158      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.22e+03 |
| Reward Loss         | -633     |
| Running Env Steps   | 790000   |
| Running Forward KL  | 36.1     |
| Running Reverse KL  | 8.26     |
| Running Update Time | 158      |
----------------------------------
--2023-11-06 16:32:18.107167 CST--
| Itration            | 159      |
| Real Det Return     | 2.58e+03 |
| Real Sto Return     | 2.34e+03 |
| Reward Loss         | -640     |
| Running Env Steps   | 795000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 8.28     |
| Running Update Time | 159      |
----------------------------------
--2023-11-06 16:34:29.806737 CST--
| Itration            | 160      |
| Real Det Return     | 2.65e+03 |
| Real Sto Return     | 2.31e+03 |
| Reward Loss         | -618     |
| Running Env Steps   | 800000   |
| Running Forward KL  | 36.6     |
| Running Reverse KL  | 7.98     |
| Running Update Time | 160      |
----------------------------------
--2023-11-06 16:36:41.908239 CST--
| Itration            | 161      |
| Real Det Return     | 2.44e+03 |
| Real Sto Return     | 2.28e+03 |
| Reward Loss         | -645     |
| Running Env Steps   | 805000   |
| Running Forward KL  | 35.1     |
| Running Reverse KL  | 8.19     |
| Running Update Time | 161      |
----------------------------------
--2023-11-06 16:38:53.781558 CST--
| Itration            | 162      |
| Real Det Return     | 2.56e+03 |
| Real Sto Return     | 2.3e+03  |
| Reward Loss         | -629     |
| Running Env Steps   | 810000   |
| Running Forward KL  | 36.1     |
| Running Reverse KL  | 8.12     |
| Running Update Time | 162      |
----------------------------------
--2023-11-06 16:41:05.859406 CST--
| Itration            | 163      |
| Real Det Return     | 2.55e+03 |
| Real Sto Return     | 2.32e+03 |
| Reward Loss         | -645     |
| Running Env Steps   | 815000   |
| Running Forward KL  | 36.1     |
| Running Reverse KL  | 8.17     |
| Running Update Time | 163      |
----------------------------------
--2023-11-06 16:43:17.659079 CST--
| Itration            | 164      |
| Real Det Return     | 2.19e+03 |
| Real Sto Return     | 2.43e+03 |
| Reward Loss         | -609     |
| Running Env Steps   | 820000   |
| Running Forward KL  | 35.7     |
| Running Reverse KL  | 8.09     |
| Running Update Time | 164      |
----------------------------------
--2023-11-06 16:45:29.396422 CST--
| Itration            | 165      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 2.36e+03 |
| Reward Loss         | -657     |
| Running Env Steps   | 825000   |
| Running Forward KL  | 36.2     |
| Running Reverse KL  | 8.25     |
| Running Update Time | 165      |
----------------------------------
--2023-11-06 16:47:41.113290 CST--
| Itration            | 166      |
| Real Det Return     | 2.52e+03 |
| Real Sto Return     | 2.38e+03 |
| Reward Loss         | -649     |
| Running Env Steps   | 830000   |
| Running Forward KL  | 35.6     |
| Running Reverse KL  | 8.12     |
| Running Update Time | 166      |
----------------------------------
--2023-11-06 16:49:52.901027 CST--
| Itration            | 167      |
| Real Det Return     | 2.25e+03 |
| Real Sto Return     | 2.37e+03 |
| Reward Loss         | -639     |
| Running Env Steps   | 835000   |
| Running Forward KL  | 35.9     |
| Running Reverse KL  | 8.09     |
| Running Update Time | 167      |
----------------------------------
--2023-11-06 16:52:04.997876 CST--
| Itration            | 168      |
| Real Det Return     | 2.33e+03 |
| Real Sto Return     | 2.41e+03 |
| Reward Loss         | -629     |
| Running Env Steps   | 840000   |
| Running Forward KL  | 35.8     |
| Running Reverse KL  | 8.09     |
| Running Update Time | 168      |
----------------------------------
--2023-11-06 16:54:16.758124 CST--
| Itration            | 169      |
| Real Det Return     | 2.44e+03 |
| Real Sto Return     | 2.43e+03 |
| Reward Loss         | -643     |
| Running Env Steps   | 845000   |
| Running Forward KL  | 35.3     |
| Running Reverse KL  | 8.08     |
| Running Update Time | 169      |
----------------------------------
--2023-11-06 16:56:28.623485 CST--
| Itration            | 170      |
| Real Det Return     | 2.6e+03  |
| Real Sto Return     | 2.39e+03 |
| Reward Loss         | -658     |
| Running Env Steps   | 850000   |
| Running Forward KL  | 35.6     |
| Running Reverse KL  | 8.19     |
| Running Update Time | 170      |
----------------------------------
--2023-11-06 16:58:40.397915 CST--
| Itration            | 171      |
| Real Det Return     | 2.61e+03 |
| Real Sto Return     | 2.35e+03 |
| Reward Loss         | -649     |
| Running Env Steps   | 855000   |
| Running Forward KL  | 36.1     |
| Running Reverse KL  | 8.13     |
| Running Update Time | 171      |
----------------------------------
--2023-11-06 17:00:52.246792 CST--
| Itration            | 172      |
| Real Det Return     | 1.99e+03 |
| Real Sto Return     | 2.43e+03 |
| Reward Loss         | -665     |
| Running Env Steps   | 860000   |
| Running Forward KL  | 37       |
| Running Reverse KL  | 8.11     |
| Running Update Time | 172      |
----------------------------------
--2023-11-06 17:03:04.378900 CST--
| Itration            | 173      |
| Real Det Return     | 2.4e+03  |
| Real Sto Return     | 2.4e+03  |
| Reward Loss         | -653     |
| Running Env Steps   | 865000   |
| Running Forward KL  | 35.3     |
| Running Reverse KL  | 8.07     |
| Running Update Time | 173      |
----------------------------------
--2023-11-06 17:05:16.751578 CST--
| Itration            | 174      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 2.43e+03 |
| Reward Loss         | -659     |
| Running Env Steps   | 870000   |
| Running Forward KL  | 36.3     |
| Running Reverse KL  | 7.9      |
| Running Update Time | 174      |
----------------------------------
--2023-11-06 17:07:29.694335 CST--
| Itration            | 175      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.39e+03 |
| Reward Loss         | -666     |
| Running Env Steps   | 875000   |
| Running Forward KL  | 35.7     |
| Running Reverse KL  | 8.09     |
| Running Update Time | 175      |
----------------------------------
--2023-11-06 17:09:42.297735 CST--
| Itration            | 176      |
| Real Det Return     | 2.42e+03 |
| Real Sto Return     | 2.4e+03  |
| Reward Loss         | -648     |
| Running Env Steps   | 880000   |
| Running Forward KL  | 34.9     |
| Running Reverse KL  | 7.96     |
| Running Update Time | 176      |
----------------------------------
--2023-11-06 17:11:54.771614 CST--
| Itration            | 177      |
| Real Det Return     | 2.48e+03 |
| Real Sto Return     | 2.41e+03 |
| Reward Loss         | -677     |
| Running Env Steps   | 885000   |
| Running Forward KL  | 34.9     |
| Running Reverse KL  | 8.05     |
| Running Update Time | 177      |
----------------------------------
--2023-11-06 17:14:07.414947 CST--
| Itration            | 178      |
| Real Det Return     | 2.42e+03 |
| Real Sto Return     | 2.29e+03 |
| Reward Loss         | -674     |
| Running Env Steps   | 890000   |
| Running Forward KL  | 35.7     |
| Running Reverse KL  | 8.14     |
| Running Update Time | 178      |
----------------------------------
--2023-11-06 17:16:20.086092 CST--
| Itration            | 179      |
| Real Det Return     | 2.5e+03  |
| Real Sto Return     | 2.37e+03 |
| Reward Loss         | -677     |
| Running Env Steps   | 895000   |
| Running Forward KL  | 35.2     |
| Running Reverse KL  | 8.07     |
| Running Update Time | 179      |
----------------------------------
--2023-11-06 17:18:32.507233 CST--
| Itration            | 180      |
| Real Det Return     | 2.42e+03 |
| Real Sto Return     | 2.38e+03 |
| Reward Loss         | -671     |
| Running Env Steps   | 900000   |
| Running Forward KL  | 35.4     |
| Running Reverse KL  | 8.03     |
| Running Update Time | 180      |
----------------------------------
--2023-11-06 17:20:44.996438 CST--
| Itration            | 181      |
| Real Det Return     | 2.35e+03 |
| Real Sto Return     | 2.43e+03 |
| Reward Loss         | -653     |
| Running Env Steps   | 905000   |
| Running Forward KL  | 34.2     |
| Running Reverse KL  | 7.98     |
| Running Update Time | 181      |
----------------------------------
--2023-11-06 17:22:57.552140 CST--
| Itration            | 182      |
| Real Det Return     | 2.13e+03 |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -643     |
| Running Env Steps   | 910000   |
| Running Forward KL  | 35.1     |
| Running Reverse KL  | 7.88     |
| Running Update Time | 182      |
----------------------------------
--2023-11-06 17:25:09.432253 CST--
| Itration            | 183      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -652     |
| Running Env Steps   | 915000   |
| Running Forward KL  | 35.4     |
| Running Reverse KL  | 7.88     |
| Running Update Time | 183      |
----------------------------------
--2023-11-06 17:27:21.729854 CST--
| Itration            | 184      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -670     |
| Running Env Steps   | 920000   |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 184      |
----------------------------------
--2023-11-06 17:29:33.709302 CST--
| Itration            | 185      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -664     |
| Running Env Steps   | 925000   |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.95     |
| Running Update Time | 185      |
----------------------------------
--2023-11-06 17:31:45.766033 CST--
| Itration            | 186      |
| Real Det Return     | 2.21e+03 |
| Real Sto Return     | 2.48e+03 |
| Reward Loss         | -670     |
| Running Env Steps   | 930000   |
| Running Forward KL  | 35       |
| Running Reverse KL  | 7.88     |
| Running Update Time | 186      |
----------------------------------
--2023-11-06 17:33:57.738689 CST--
| Itration            | 187      |
| Real Det Return     | 1.92e+03 |
| Real Sto Return     | 2.53e+03 |
| Reward Loss         | -675     |
| Running Env Steps   | 935000   |
| Running Forward KL  | 35.8     |
| Running Reverse KL  | 7.95     |
| Running Update Time | 187      |
----------------------------------
--2023-11-06 17:36:09.590598 CST--
| Itration            | 188      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.48e+03 |
| Reward Loss         | -673     |
| Running Env Steps   | 940000   |
| Running Forward KL  | 34.9     |
| Running Reverse KL  | 7.93     |
| Running Update Time | 188      |
----------------------------------
--2023-11-06 17:38:21.501455 CST--
| Itration            | 189      |
| Real Det Return     | 1.92e+03 |
| Real Sto Return     | 2.5e+03  |
| Reward Loss         | -674     |
| Running Env Steps   | 945000   |
| Running Forward KL  | 35.3     |
| Running Reverse KL  | 7.99     |
| Running Update Time | 189      |
----------------------------------
--2023-11-06 17:40:33.336132 CST--
| Itration            | 190      |
| Real Det Return     | 2.23e+03 |
| Real Sto Return     | 2.45e+03 |
| Reward Loss         | -677     |
| Running Env Steps   | 950000   |
| Running Forward KL  | 34.6     |
| Running Reverse KL  | 7.89     |
| Running Update Time | 190      |
----------------------------------
--2023-11-06 17:42:45.765949 CST--
| Itration            | 191      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.5e+03  |
| Reward Loss         | -665     |
| Running Env Steps   | 955000   |
| Running Forward KL  | 34.4     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 191      |
----------------------------------
--2023-11-06 17:44:58.153009 CST--
| Itration            | 192      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.42e+03 |
| Reward Loss         | -686     |
| Running Env Steps   | 960000   |
| Running Forward KL  | 35.1     |
| Running Reverse KL  | 7.89     |
| Running Update Time | 192      |
----------------------------------
--2023-11-06 17:47:10.350993 CST--
| Itration            | 193      |
| Real Det Return     | 2.23e+03 |
| Real Sto Return     | 2.49e+03 |
| Reward Loss         | -696     |
| Running Env Steps   | 965000   |
| Running Forward KL  | 35.4     |
| Running Reverse KL  | 7.86     |
| Running Update Time | 193      |
----------------------------------
--2023-11-06 17:49:22.385152 CST--
| Itration            | 194      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -677     |
| Running Env Steps   | 970000   |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.82     |
| Running Update Time | 194      |
----------------------------------
--2023-11-06 17:51:34.356769 CST--
| Itration            | 195      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.42e+03 |
| Reward Loss         | -704     |
| Running Env Steps   | 975000   |
| Running Forward KL  | 35       |
| Running Reverse KL  | 8.01     |
| Running Update Time | 195      |
----------------------------------
--2023-11-06 17:53:46.371489 CST--
| Itration            | 196      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 2.49e+03 |
| Reward Loss         | -699     |
| Running Env Steps   | 980000   |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.91     |
| Running Update Time | 196      |
----------------------------------
--2023-11-06 17:55:58.317745 CST--
| Itration            | 197      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.44e+03 |
| Reward Loss         | -721     |
| Running Env Steps   | 985000   |
| Running Forward KL  | 35.4     |
| Running Reverse KL  | 7.94     |
| Running Update Time | 197      |
----------------------------------
--2023-11-06 17:58:10.008175 CST--
| Itration            | 198      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 2.44e+03 |
| Reward Loss         | -710     |
| Running Env Steps   | 990000   |
| Running Forward KL  | 34.5     |
| Running Reverse KL  | 7.84     |
| Running Update Time | 198      |
----------------------------------
--2023-11-06 18:00:21.393383 CST--
| Itration            | 199      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -669     |
| Running Env Steps   | 995000   |
| Running Forward KL  | 34.5     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 199      |
----------------------------------
--2023-11-06 18:02:32.910469 CST--
| Itration            | 200      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.45e+03 |
| Reward Loss         | -715     |
| Running Env Steps   | 1000000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.82     |
| Running Update Time | 200      |
----------------------------------
--2023-11-06 18:04:44.210964 CST--
| Itration            | 201      |
| Real Det Return     | 1.98e+03 |
| Real Sto Return     | 2.49e+03 |
| Reward Loss         | -709     |
| Running Env Steps   | 1005000  |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.76     |
| Running Update Time | 201      |
----------------------------------
--2023-11-06 18:06:55.738641 CST--
| Itration            | 202      |
| Real Det Return     | 2.02e+03 |
| Real Sto Return     | 2.53e+03 |
| Reward Loss         | -685     |
| Running Env Steps   | 1010000  |
| Running Forward KL  | 33.9     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 202      |
----------------------------------
--2023-11-06 18:09:07.131540 CST--
| Itration            | 203      |
| Real Det Return     | 1.96e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -679     |
| Running Env Steps   | 1015000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 203      |
----------------------------------
--2023-11-06 18:11:19.682899 CST--
| Itration            | 204      |
| Real Det Return     | 2.21e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -698     |
| Running Env Steps   | 1020000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 204      |
----------------------------------
--2023-11-06 18:13:32.604157 CST--
| Itration            | 205      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.52e+03 |
| Reward Loss         | -702     |
| Running Env Steps   | 1025000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.85     |
| Running Update Time | 205      |
----------------------------------
--2023-11-06 18:15:44.475701 CST--
| Itration            | 206      |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 2.5e+03  |
| Reward Loss         | -723     |
| Running Env Steps   | 1030000  |
| Running Forward KL  | 34.6     |
| Running Reverse KL  | 7.81     |
| Running Update Time | 206      |
----------------------------------
--2023-11-06 18:17:56.289426 CST--
| Itration            | 207      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.52e+03 |
| Reward Loss         | -705     |
| Running Env Steps   | 1035000  |
| Running Forward KL  | 34.4     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 207      |
----------------------------------
--2023-11-06 18:20:08.457174 CST--
| Itration            | 208      |
| Real Det Return     | 2.08e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -689     |
| Running Env Steps   | 1040000  |
| Running Forward KL  | 34.3     |
| Running Reverse KL  | 7.76     |
| Running Update Time | 208      |
----------------------------------
--2023-11-06 18:22:20.789576 CST--
| Itration            | 209      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -726     |
| Running Env Steps   | 1045000  |
| Running Forward KL  | 34.4     |
| Running Reverse KL  | 7.78     |
| Running Update Time | 209      |
----------------------------------
--2023-11-06 18:24:33.254192 CST--
| Itration            | 210      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -678     |
| Running Env Steps   | 1050000  |
| Running Forward KL  | 33.9     |
| Running Reverse KL  | 7.67     |
| Running Update Time | 210      |
----------------------------------
--2023-11-06 18:26:45.825875 CST--
| Itration            | 211      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.5e+03  |
| Reward Loss         | -722     |
| Running Env Steps   | 1055000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 211      |
----------------------------------
--2023-11-06 18:28:58.297381 CST--
| Itration            | 212      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -711     |
| Running Env Steps   | 1060000  |
| Running Forward KL  | 34.6     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 212      |
----------------------------------
--2023-11-06 18:31:10.748564 CST--
| Itration            | 213      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -720     |
| Running Env Steps   | 1065000  |
| Running Forward KL  | 34.7     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 213      |
----------------------------------
--2023-11-06 18:33:22.544378 CST--
| Itration            | 214      |
| Real Det Return     | 1.87e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -714     |
| Running Env Steps   | 1070000  |
| Running Forward KL  | 34.9     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 214      |
----------------------------------
--2023-11-06 18:35:34.148947 CST--
| Itration            | 215      |
| Real Det Return     | 1.91e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -722     |
| Running Env Steps   | 1075000  |
| Running Forward KL  | 34.8     |
| Running Reverse KL  | 7.72     |
| Running Update Time | 215      |
----------------------------------
--2023-11-06 18:37:45.959579 CST--
| Itration            | 216      |
| Real Det Return     | 2.09e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -729     |
| Running Env Steps   | 1080000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 216      |
----------------------------------
--2023-11-06 18:39:57.691671 CST--
| Itration            | 217      |
| Real Det Return     | 2.13e+03 |
| Real Sto Return     | 2.53e+03 |
| Reward Loss         | -709     |
| Running Env Steps   | 1085000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.73     |
| Running Update Time | 217      |
----------------------------------
--2023-11-06 18:42:09.301232 CST--
| Itration            | 218      |
| Real Det Return     | 2.13e+03 |
| Real Sto Return     | 2.49e+03 |
| Reward Loss         | -722     |
| Running Env Steps   | 1090000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.85     |
| Running Update Time | 218      |
----------------------------------
--2023-11-06 18:44:20.739705 CST--
| Itration            | 219      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.52e+03 |
| Reward Loss         | -725     |
| Running Env Steps   | 1095000  |
| Running Forward KL  | 34.1     |
| Running Reverse KL  | 7.69     |
| Running Update Time | 219      |
----------------------------------
--2023-11-06 18:46:32.225881 CST--
| Itration            | 220      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -740     |
| Running Env Steps   | 1100000  |
| Running Forward KL  | 34.1     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 220      |
----------------------------------
--2023-11-06 18:48:43.540931 CST--
| Itration            | 221      |
| Real Det Return     | 2.05e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -724     |
| Running Env Steps   | 1105000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.68     |
| Running Update Time | 221      |
----------------------------------
--2023-11-06 18:50:54.944840 CST--
| Itration            | 222      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -680     |
| Running Env Steps   | 1110000  |
| Running Forward KL  | 34.2     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 222      |
----------------------------------
--2023-11-06 18:53:06.524779 CST--
| Itration            | 223      |
| Real Det Return     | 2.21e+03 |
| Real Sto Return     | 2.53e+03 |
| Reward Loss         | -738     |
| Running Env Steps   | 1115000  |
| Running Forward KL  | 34.2     |
| Running Reverse KL  | 7.74     |
| Running Update Time | 223      |
----------------------------------
--2023-11-06 18:55:18.110253 CST--
| Itration            | 224      |
| Real Det Return     | 2.05e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -746     |
| Running Env Steps   | 1120000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 224      |
----------------------------------
--2023-11-06 18:57:29.942326 CST--
| Itration            | 225      |
| Real Det Return     | 2.02e+03 |
| Real Sto Return     | 2.55e+03 |
| Reward Loss         | -721     |
| Running Env Steps   | 1125000  |
| Running Forward KL  | 33.4     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 225      |
----------------------------------
--2023-11-06 18:59:41.542274 CST--
| Itration            | 226      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -729     |
| Running Env Steps   | 1130000  |
| Running Forward KL  | 33.8     |
| Running Reverse KL  | 7.74     |
| Running Update Time | 226      |
----------------------------------
--2023-11-06 19:01:53.530505 CST--
| Itration            | 227      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -742     |
| Running Env Steps   | 1135000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.66     |
| Running Update Time | 227      |
----------------------------------
--2023-11-06 19:03:57.139375 CST--
| Itration            | 228      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -753     |
| Running Env Steps   | 1140000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.64     |
| Running Update Time | 228      |
----------------------------------
--2023-11-06 19:06:01.238658 CST--
| Itration            | 229      |
| Real Det Return     | 1.92e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -727     |
| Running Env Steps   | 1145000  |
| Running Forward KL  | 33.9     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 229      |
----------------------------------
--2023-11-06 19:08:04.916045 CST--
| Itration            | 230      |
| Real Det Return     | 2.02e+03 |
| Real Sto Return     | 2.53e+03 |
| Reward Loss         | -742     |
| Running Env Steps   | 1150000  |
| Running Forward KL  | 33.6     |
| Running Reverse KL  | 7.76     |
| Running Update Time | 230      |
----------------------------------
--2023-11-06 19:10:08.637840 CST--
| Itration            | 231      |
| Real Det Return     | 2.09e+03 |
| Real Sto Return     | 2.55e+03 |
| Reward Loss         | -754     |
| Running Env Steps   | 1155000  |
| Running Forward KL  | 34.1     |
| Running Reverse KL  | 7.71     |
| Running Update Time | 231      |
----------------------------------
--2023-11-06 19:12:12.740002 CST--
| Itration            | 232      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.51e+03 |
| Reward Loss         | -765     |
| Running Env Steps   | 1160000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.71     |
| Running Update Time | 232      |
----------------------------------
--2023-11-06 19:14:16.274225 CST--
| Itration            | 233      |
| Real Det Return     | 1.81e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -738     |
| Running Env Steps   | 1165000  |
| Running Forward KL  | 34.4     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 233      |
----------------------------------
--2023-11-06 19:16:19.853266 CST--
| Itration            | 234      |
| Real Det Return     | 1.99e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -745     |
| Running Env Steps   | 1170000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.58     |
| Running Update Time | 234      |
----------------------------------
--2023-11-06 19:18:23.515013 CST--
| Itration            | 235      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -750     |
| Running Env Steps   | 1175000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 235      |
----------------------------------
--2023-11-06 19:20:27.252304 CST--
| Itration            | 236      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -719     |
| Running Env Steps   | 1180000  |
| Running Forward KL  | 33.7     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 236      |
----------------------------------
--2023-11-06 19:22:31.495632 CST--
| Itration            | 237      |
| Real Det Return     | 1.87e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -724     |
| Running Env Steps   | 1185000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 237      |
----------------------------------
--2023-11-06 19:24:35.959590 CST--
| Itration            | 238      |
| Real Det Return     | 2.01e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -755     |
| Running Env Steps   | 1190000  |
| Running Forward KL  | 34.3     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 238      |
----------------------------------
--2023-11-06 19:26:40.164062 CST--
| Itration            | 239      |
| Real Det Return     | 1.95e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -748     |
| Running Env Steps   | 1195000  |
| Running Forward KL  | 33.8     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 239      |
----------------------------------
--2023-11-06 19:28:44.431571 CST--
| Itration            | 240      |
| Real Det Return     | 2.08e+03 |
| Real Sto Return     | 2.55e+03 |
| Reward Loss         | -728     |
| Running Env Steps   | 1200000  |
| Running Forward KL  | 33.4     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 240      |
----------------------------------
--2023-11-06 19:30:48.111831 CST--
| Itration            | 241      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -776     |
| Running Env Steps   | 1205000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 241      |
----------------------------------
--2023-11-06 19:32:52.237982 CST--
| Itration            | 242      |
| Real Det Return     | 1.93e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -754     |
| Running Env Steps   | 1210000  |
| Running Forward KL  | 34.2     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 242      |
----------------------------------
--2023-11-06 19:34:56.661403 CST--
| Itration            | 243      |
| Real Det Return     | 1.99e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -742     |
| Running Env Steps   | 1215000  |
| Running Forward KL  | 34.2     |
| Running Reverse KL  | 7.57     |
| Running Update Time | 243      |
----------------------------------
--2023-11-06 19:37:00.427896 CST--
| Itration            | 244      |
| Real Det Return     | 2.02e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -762     |
| Running Env Steps   | 1220000  |
| Running Forward KL  | 33.1     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 244      |
----------------------------------
--2023-11-06 19:39:05.201136 CST--
| Itration            | 245      |
| Real Det Return     | 1.99e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -757     |
| Running Env Steps   | 1225000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.73     |
| Running Update Time | 245      |
----------------------------------
--2023-11-06 19:41:09.698329 CST--
| Itration            | 246      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -754     |
| Running Env Steps   | 1230000  |
| Running Forward KL  | 33.4     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 246      |
----------------------------------
--2023-11-06 19:43:13.506911 CST--
| Itration            | 247      |
| Real Det Return     | 2.03e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -764     |
| Running Env Steps   | 1235000  |
| Running Forward KL  | 34       |
| Running Reverse KL  | 7.6      |
| Running Update Time | 247      |
----------------------------------
--2023-11-06 19:45:17.885443 CST--
| Itration            | 248      |
| Real Det Return     | 2.25e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -746     |
| Running Env Steps   | 1240000  |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 248      |
----------------------------------
--2023-11-06 19:47:22.533246 CST--
| Itration            | 249      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -774     |
| Running Env Steps   | 1245000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.59     |
| Running Update Time | 249      |
----------------------------------
--2023-11-06 19:49:27.725509 CST--
| Itration            | 250      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -780     |
| Running Env Steps   | 1250000  |
| Running Forward KL  | 32.9     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 250      |
----------------------------------
--2023-11-06 19:51:31.643470 CST--
| Itration            | 251      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -750     |
| Running Env Steps   | 1255000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 251      |
----------------------------------
--2023-11-06 19:53:35.864568 CST--
| Itration            | 252      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -771     |
| Running Env Steps   | 1260000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 252      |
----------------------------------
--2023-11-06 19:55:40.644414 CST--
| Itration            | 253      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -787     |
| Running Env Steps   | 1265000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.64     |
| Running Update Time | 253      |
----------------------------------
--2023-11-06 19:57:45.114348 CST--
| Itration            | 254      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -795     |
| Running Env Steps   | 1270000  |
| Running Forward KL  | 32.9     |
| Running Reverse KL  | 7.57     |
| Running Update Time | 254      |
----------------------------------
--2023-11-06 19:59:48.723211 CST--
| Itration            | 255      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -759     |
| Running Env Steps   | 1275000  |
| Running Forward KL  | 32.7     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 255      |
----------------------------------
--2023-11-06 20:01:52.388747 CST--
| Itration            | 256      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -757     |
| Running Env Steps   | 1280000  |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 256      |
----------------------------------
--2023-11-06 20:03:56.525943 CST--
| Itration            | 257      |
| Real Det Return     | 2.03e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -750     |
| Running Env Steps   | 1285000  |
| Running Forward KL  | 33.7     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 257      |
----------------------------------
--2023-11-06 20:06:00.636362 CST--
| Itration            | 258      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -791     |
| Running Env Steps   | 1290000  |
| Running Forward KL  | 32.8     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 258      |
----------------------------------
--2023-11-06 20:08:04.191837 CST--
| Itration            | 259      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -755     |
| Running Env Steps   | 1295000  |
| Running Forward KL  | 32.8     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 259      |
----------------------------------
--2023-11-06 20:10:07.870190 CST--
| Itration            | 260      |
| Real Det Return     | 1.97e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -767     |
| Running Env Steps   | 1300000  |
| Running Forward KL  | 33.1     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 260      |
----------------------------------
--2023-11-06 20:12:11.572081 CST--
| Itration            | 261      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -760     |
| Running Env Steps   | 1305000  |
| Running Forward KL  | 32.7     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 261      |
----------------------------------
--2023-11-06 20:14:15.223820 CST--
| Itration            | 262      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -777     |
| Running Env Steps   | 1310000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.56     |
| Running Update Time | 262      |
----------------------------------
--2023-11-06 20:16:18.958884 CST--
| Itration            | 263      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -757     |
| Running Env Steps   | 1315000  |
| Running Forward KL  | 33.3     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 263      |
----------------------------------
--2023-11-06 20:18:23.455634 CST--
| Itration            | 264      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -790     |
| Running Env Steps   | 1320000  |
| Running Forward KL  | 33.5     |
| Running Reverse KL  | 7.6      |
| Running Update Time | 264      |
----------------------------------
--2023-11-06 20:20:27.869878 CST--
| Itration            | 265      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -769     |
| Running Env Steps   | 1325000  |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 265      |
----------------------------------
--2023-11-06 20:22:32.032513 CST--
| Itration            | 266      |
| Real Det Return     | 2.14e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -784     |
| Running Env Steps   | 1330000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.52     |
| Running Update Time | 266      |
----------------------------------
--2023-11-06 20:24:36.361658 CST--
| Itration            | 267      |
| Real Det Return     | 2.19e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -786     |
| Running Env Steps   | 1335000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 267      |
----------------------------------
--2023-11-06 20:26:41.824058 CST--
| Itration            | 268      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.56e+03 |
| Reward Loss         | -784     |
| Running Env Steps   | 1340000  |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 268      |
----------------------------------
--2023-11-06 20:28:47.187286 CST--
| Itration            | 269      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -768     |
| Running Env Steps   | 1345000  |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 269      |
----------------------------------
--2023-11-06 20:30:52.301824 CST--
| Itration            | 270      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -782     |
| Running Env Steps   | 1350000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.5      |
| Running Update Time | 270      |
----------------------------------
--2023-11-06 20:32:57.755671 CST--
| Itration            | 271      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -809     |
| Running Env Steps   | 1355000  |
| Running Forward KL  | 32.7     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 271      |
----------------------------------
--2023-11-06 20:35:03.380042 CST--
| Itration            | 272      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -774     |
| Running Env Steps   | 1360000  |
| Running Forward KL  | 32.1     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 272      |
----------------------------------
--2023-11-06 20:37:08.804156 CST--
| Itration            | 273      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -786     |
| Running Env Steps   | 1365000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 7.69     |
| Running Update Time | 273      |
----------------------------------
--2023-11-06 20:39:13.738608 CST--
| Itration            | 274      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -777     |
| Running Env Steps   | 1370000  |
| Running Forward KL  | 32.8     |
| Running Reverse KL  | 7.46     |
| Running Update Time | 274      |
----------------------------------
--2023-11-06 20:41:19.203441 CST--
| Itration            | 275      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -794     |
| Running Env Steps   | 1375000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.47     |
| Running Update Time | 275      |
----------------------------------
--2023-11-06 20:43:24.745343 CST--
| Itration            | 276      |
| Real Det Return     | 2.03e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -790     |
| Running Env Steps   | 1380000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 276      |
----------------------------------
--2023-11-06 20:45:31.988503 CST--
| Itration            | 277      |
| Real Det Return     | 2.06e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -782     |
| Running Env Steps   | 1385000  |
| Running Forward KL  | 32.9     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 277      |
----------------------------------
--2023-11-06 20:47:38.851856 CST--
| Itration            | 278      |
| Real Det Return     | 2e+03    |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -773     |
| Running Env Steps   | 1390000  |
| Running Forward KL  | 31.6     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 278      |
----------------------------------
--2023-11-06 20:49:45.929101 CST--
| Itration            | 279      |
| Real Det Return     | 2.13e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -791     |
| Running Env Steps   | 1395000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 7.48     |
| Running Update Time | 279      |
----------------------------------
--2023-11-06 20:51:53.017496 CST--
| Itration            | 280      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -791     |
| Running Env Steps   | 1400000  |
| Running Forward KL  | 32.4     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 280      |
----------------------------------
--2023-11-06 20:54:00.390267 CST--
| Itration            | 281      |
| Real Det Return     | 2e+03    |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -795     |
| Running Env Steps   | 1405000  |
| Running Forward KL  | 32.9     |
| Running Reverse KL  | 7.65     |
| Running Update Time | 281      |
----------------------------------
--2023-11-06 20:56:07.399236 CST--
| Itration            | 282      |
| Real Det Return     | 1.95e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -774     |
| Running Env Steps   | 1410000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 7.66     |
| Running Update Time | 282      |
----------------------------------
--2023-11-06 20:58:14.168723 CST--
| Itration            | 283      |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -788     |
| Running Env Steps   | 1415000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.5      |
| Running Update Time | 283      |
----------------------------------
--2023-11-06 21:00:20.904668 CST--
| Itration            | 284      |
| Real Det Return     | 1.92e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -796     |
| Running Env Steps   | 1420000  |
| Running Forward KL  | 33       |
| Running Reverse KL  | 7.5      |
| Running Update Time | 284      |
----------------------------------
--2023-11-06 21:02:27.426377 CST--
| Itration            | 285      |
| Real Det Return     | 2e+03    |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -789     |
| Running Env Steps   | 1425000  |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 285      |
----------------------------------
--2023-11-06 21:04:34.327016 CST--
| Itration            | 286      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -802     |
| Running Env Steps   | 1430000  |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 286      |
----------------------------------
--2023-11-06 21:06:41.301481 CST--
| Itration            | 287      |
| Real Det Return     | 2e+03    |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -783     |
| Running Env Steps   | 1435000  |
| Running Forward KL  | 32.9     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 287      |
----------------------------------
--2023-11-06 21:08:48.073815 CST--
| Itration            | 288      |
| Real Det Return     | 2.01e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -803     |
| Running Env Steps   | 1440000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 288      |
----------------------------------
--2023-11-06 21:10:55.008836 CST--
| Itration            | 289      |
| Real Det Return     | 2.4e+03  |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -807     |
| Running Env Steps   | 1445000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.46     |
| Running Update Time | 289      |
----------------------------------
--2023-11-06 21:13:01.804408 CST--
| Itration            | 290      |
| Real Det Return     | 2.15e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -791     |
| Running Env Steps   | 1450000  |
| Running Forward KL  | 31.8     |
| Running Reverse KL  | 7.43     |
| Running Update Time | 290      |
----------------------------------
--2023-11-06 21:15:08.500463 CST--
| Itration            | 291      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -778     |
| Running Env Steps   | 1455000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.55     |
| Running Update Time | 291      |
----------------------------------
--2023-11-06 21:17:15.198605 CST--
| Itration            | 292      |
| Real Det Return     | 2.39e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -804     |
| Running Env Steps   | 1460000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.61     |
| Running Update Time | 292      |
----------------------------------
--2023-11-06 21:19:22.103713 CST--
| Itration            | 293      |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -772     |
| Running Env Steps   | 1465000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.41     |
| Running Update Time | 293      |
----------------------------------
--2023-11-06 21:21:28.930193 CST--
| Itration            | 294      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -792     |
| Running Env Steps   | 1470000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.32     |
| Running Update Time | 294      |
----------------------------------
--2023-11-06 21:23:35.582597 CST--
| Itration            | 295      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -797     |
| Running Env Steps   | 1475000  |
| Running Forward KL  | 32.1     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 295      |
----------------------------------
--2023-11-06 21:25:42.443756 CST--
| Itration            | 296      |
| Real Det Return     | 2.09e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -816     |
| Running Env Steps   | 1480000  |
| Running Forward KL  | 31.9     |
| Running Reverse KL  | 7.57     |
| Running Update Time | 296      |
----------------------------------
--2023-11-06 21:27:48.998424 CST--
| Itration            | 297      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -792     |
| Running Env Steps   | 1485000  |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 297      |
----------------------------------
--2023-11-06 21:29:55.802466 CST--
| Itration            | 298      |
| Real Det Return     | 1.98e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -791     |
| Running Env Steps   | 1490000  |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 298      |
----------------------------------
--2023-11-06 21:32:02.713777 CST--
| Itration            | 299      |
| Real Det Return     | 2e+03    |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -762     |
| Running Env Steps   | 1495000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.45     |
| Running Update Time | 299      |
----------------------------------
--2023-11-06 21:34:09.601015 CST--
| Itration            | 300      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -814     |
| Running Env Steps   | 1500000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.53     |
| Running Update Time | 300      |
----------------------------------
--2023-11-06 21:36:16.836507 CST--
| Itration            | 301      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -834     |
| Running Env Steps   | 1505000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 301      |
----------------------------------
--2023-11-06 21:38:23.907383 CST--
| Itration            | 302      |
| Real Det Return     | 2.01e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -784     |
| Running Env Steps   | 1510000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 302      |
----------------------------------
--2023-11-06 21:40:28.398911 CST--
| Itration            | 303      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -822     |
| Running Env Steps   | 1515000  |
| Running Forward KL  | 31.9     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 303      |
----------------------------------
--2023-11-06 21:42:32.866902 CST--
| Itration            | 304      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -810     |
| Running Env Steps   | 1520000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.42     |
| Running Update Time | 304      |
----------------------------------
--2023-11-06 21:44:36.835101 CST--
| Itration            | 305      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -791     |
| Running Env Steps   | 1525000  |
| Running Forward KL  | 32.5     |
| Running Reverse KL  | 7.44     |
| Running Update Time | 305      |
----------------------------------
--2023-11-06 21:46:40.824662 CST--
| Itration            | 306      |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -783     |
| Running Env Steps   | 1530000  |
| Running Forward KL  | 31.3     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 306      |
----------------------------------
--2023-11-06 21:48:44.843980 CST--
| Itration            | 307      |
| Real Det Return     | 2.13e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -812     |
| Running Env Steps   | 1535000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.51     |
| Running Update Time | 307      |
----------------------------------
--2023-11-06 21:50:48.981880 CST--
| Itration            | 308      |
| Real Det Return     | 1.93e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -799     |
| Running Env Steps   | 1540000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.41     |
| Running Update Time | 308      |
----------------------------------
--2023-11-06 21:52:52.907757 CST--
| Itration            | 309      |
| Real Det Return     | 1.95e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -810     |
| Running Env Steps   | 1545000  |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 309      |
----------------------------------
--2023-11-06 21:54:57.013501 CST--
| Itration            | 310      |
| Real Det Return     | 2.52e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -829     |
| Running Env Steps   | 1550000  |
| Running Forward KL  | 31.2     |
| Running Reverse KL  | 7.73     |
| Running Update Time | 310      |
----------------------------------
--2023-11-06 21:57:00.952020 CST--
| Itration            | 311      |
| Real Det Return     | 2.05e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -821     |
| Running Env Steps   | 1555000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.45     |
| Running Update Time | 311      |
----------------------------------
--2023-11-06 21:59:05.183520 CST--
| Itration            | 312      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -797     |
| Running Env Steps   | 1560000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 7.49     |
| Running Update Time | 312      |
----------------------------------
--2023-11-06 22:01:09.534796 CST--
| Itration            | 313      |
| Real Det Return     | 2.01e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -821     |
| Running Env Steps   | 1565000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 313      |
----------------------------------
--2023-11-06 22:03:13.895109 CST--
| Itration            | 314      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -789     |
| Running Env Steps   | 1570000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.46     |
| Running Update Time | 314      |
----------------------------------
--2023-11-06 22:05:18.000014 CST--
| Itration            | 315      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -820     |
| Running Env Steps   | 1575000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 315      |
----------------------------------
--2023-11-06 22:07:22.313357 CST--
| Itration            | 316      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -797     |
| Running Env Steps   | 1580000  |
| Running Forward KL  | 31.1     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 316      |
----------------------------------
--2023-11-06 22:09:26.598227 CST--
| Itration            | 317      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.57e+03 |
| Reward Loss         | -833     |
| Running Env Steps   | 1585000  |
| Running Forward KL  | 31.3     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 317      |
----------------------------------
--2023-11-06 22:11:35.092962 CST--
| Itration            | 318      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -821     |
| Running Env Steps   | 1590000  |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 7.48     |
| Running Update Time | 318      |
----------------------------------
--2023-11-06 22:13:44.006961 CST--
| Itration            | 319      |
| Real Det Return     | 2.09e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -808     |
| Running Env Steps   | 1595000  |
| Running Forward KL  | 31.2     |
| Running Reverse KL  | 7.38     |
| Running Update Time | 319      |
----------------------------------
--2023-11-06 22:15:52.939996 CST--
| Itration            | 320      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -829     |
| Running Env Steps   | 1600000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.48     |
| Running Update Time | 320      |
----------------------------------
--2023-11-06 22:18:02.258803 CST--
| Itration            | 321      |
| Real Det Return     | 2.15e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -828     |
| Running Env Steps   | 1605000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.41     |
| Running Update Time | 321      |
----------------------------------
--2023-11-06 22:20:11.816735 CST--
| Itration            | 322      |
| Real Det Return     | 2.35e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -812     |
| Running Env Steps   | 1610000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.48     |
| Running Update Time | 322      |
----------------------------------
--2023-11-06 22:22:20.518385 CST--
| Itration            | 323      |
| Real Det Return     | 2.03e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -803     |
| Running Env Steps   | 1615000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.4      |
| Running Update Time | 323      |
----------------------------------
--2023-11-06 22:24:25.044418 CST--
| Itration            | 324      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -823     |
| Running Env Steps   | 1620000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 324      |
----------------------------------
--2023-11-06 22:26:29.376358 CST--
| Itration            | 325      |
| Real Det Return     | 1.95e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -837     |
| Running Env Steps   | 1625000  |
| Running Forward KL  | 31.5     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 325      |
----------------------------------
--2023-11-06 22:28:33.779932 CST--
| Itration            | 326      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -840     |
| Running Env Steps   | 1630000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.51     |
| Running Update Time | 326      |
----------------------------------
--2023-11-06 22:30:37.807183 CST--
| Itration            | 327      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -824     |
| Running Env Steps   | 1635000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.54     |
| Running Update Time | 327      |
----------------------------------
--2023-11-06 22:32:42.039136 CST--
| Itration            | 328      |
| Real Det Return     | 2.04e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -852     |
| Running Env Steps   | 1640000  |
| Running Forward KL  | 30.8     |
| Running Reverse KL  | 7.42     |
| Running Update Time | 328      |
----------------------------------
--2023-11-06 22:34:46.296233 CST--
| Itration            | 329      |
| Real Det Return     | 2.08e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -822     |
| Running Env Steps   | 1645000  |
| Running Forward KL  | 30.8     |
| Running Reverse KL  | 7.39     |
| Running Update Time | 329      |
----------------------------------
--2023-11-06 22:36:50.957118 CST--
| Itration            | 330      |
| Real Det Return     | 2.73e+03 |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -816     |
| Running Env Steps   | 1650000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 330      |
----------------------------------
--2023-11-06 22:38:55.542076 CST--
| Itration            | 331      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -829     |
| Running Env Steps   | 1655000  |
| Running Forward KL  | 31.1     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 331      |
----------------------------------
--2023-11-06 22:41:00.378410 CST--
| Itration            | 332      |
| Real Det Return     | 2.47e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -807     |
| Running Env Steps   | 1660000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.56     |
| Running Update Time | 332      |
----------------------------------
--2023-11-06 22:43:05.077853 CST--
| Itration            | 333      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -831     |
| Running Env Steps   | 1665000  |
| Running Forward KL  | 31       |
| Running Reverse KL  | 7.5      |
| Running Update Time | 333      |
----------------------------------
--2023-11-06 22:45:10.857604 CST--
| Itration            | 334      |
| Real Det Return     | 2.08e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -835     |
| Running Env Steps   | 1670000  |
| Running Forward KL  | 31.1     |
| Running Reverse KL  | 7.44     |
| Running Update Time | 334      |
----------------------------------
--2023-11-06 22:47:15.363130 CST--
| Itration            | 335      |
| Real Det Return     | 2.07e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -836     |
| Running Env Steps   | 1675000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 335      |
----------------------------------
--2023-11-06 22:49:20.331924 CST--
| Itration            | 336      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -820     |
| Running Env Steps   | 1680000  |
| Running Forward KL  | 31.1     |
| Running Reverse KL  | 7.44     |
| Running Update Time | 336      |
----------------------------------
--2023-11-06 22:51:25.082824 CST--
| Itration            | 337      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -854     |
| Running Env Steps   | 1685000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.35     |
| Running Update Time | 337      |
----------------------------------
--2023-11-06 22:53:29.635847 CST--
| Itration            | 338      |
| Real Det Return     | 2.23e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -829     |
| Running Env Steps   | 1690000  |
| Running Forward KL  | 30.6     |
| Running Reverse KL  | 7.46     |
| Running Update Time | 338      |
----------------------------------
--2023-11-06 22:55:33.910776 CST--
| Itration            | 339      |
| Real Det Return     | 2.08e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -832     |
| Running Env Steps   | 1695000  |
| Running Forward KL  | 30.8     |
| Running Reverse KL  | 7.46     |
| Running Update Time | 339      |
----------------------------------
--2023-11-06 22:57:38.190994 CST--
| Itration            | 340      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -840     |
| Running Env Steps   | 1700000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.42     |
| Running Update Time | 340      |
----------------------------------
--2023-11-06 22:59:42.209703 CST--
| Itration            | 341      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -857     |
| Running Env Steps   | 1705000  |
| Running Forward KL  | 31.3     |
| Running Reverse KL  | 7.52     |
| Running Update Time | 341      |
----------------------------------
--2023-11-06 23:01:46.273571 CST--
| Itration            | 342      |
| Real Det Return     | 1.98e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -837     |
| Running Env Steps   | 1710000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 7.65     |
| Running Update Time | 342      |
----------------------------------
--2023-11-06 23:03:50.884011 CST--
| Itration            | 343      |
| Real Det Return     | 2.19e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -846     |
| Running Env Steps   | 1715000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 343      |
----------------------------------
--2023-11-06 23:05:54.927723 CST--
| Itration            | 344      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -841     |
| Running Env Steps   | 1720000  |
| Running Forward KL  | 30.6     |
| Running Reverse KL  | 7.51     |
| Running Update Time | 344      |
----------------------------------
--2023-11-06 23:08:07.597728 CST--
| Itration            | 345      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -854     |
| Running Env Steps   | 1725000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.47     |
| Running Update Time | 345      |
----------------------------------
--2023-11-06 23:10:20.366523 CST--
| Itration            | 346      |
| Real Det Return     | 2.4e+03  |
| Real Sto Return     | 2.58e+03 |
| Reward Loss         | -910     |
| Running Env Steps   | 1730000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.35     |
| Running Update Time | 346      |
----------------------------------
--2023-11-06 23:12:33.481433 CST--
| Itration            | 347      |
| Real Det Return     | 2.45e+03 |
| Real Sto Return     | 2.47e+03 |
| Reward Loss         | -880     |
| Running Env Steps   | 1735000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 347      |
----------------------------------
--2023-11-06 23:14:41.055355 CST--
| Itration            | 348      |
| Real Det Return     | 2.17e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -894     |
| Running Env Steps   | 1740000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.34     |
| Running Update Time | 348      |
----------------------------------
--2023-11-06 23:16:49.469475 CST--
| Itration            | 349      |
| Real Det Return     | 2.68e+03 |
| Real Sto Return     | 2.31e+03 |
| Reward Loss         | -989     |
| Running Env Steps   | 1745000  |
| Running Forward KL  | 31.8     |
| Running Reverse KL  | 9.73     |
| Running Update Time | 349      |
----------------------------------
--2023-11-06 23:18:57.414192 CST--
| Itration            | 350      |
| Real Det Return     | 1.67e+03 |
| Real Sto Return     | 2.09e+03 |
| Reward Loss         | -712     |
| Running Env Steps   | 1750000  |
| Running Forward KL  | 32       |
| Running Reverse KL  | 14.7     |
| Running Update Time | 350      |
----------------------------------
--2023-11-06 23:21:05.024019 CST---
| Itration            | 351       |
| Real Det Return     | 2.19e+03  |
| Real Sto Return     | 2.1e+03   |
| Reward Loss         | -1.04e+03 |
| Running Env Steps   | 1755000   |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 8.95      |
| Running Update Time | 351       |
-----------------------------------
--2023-11-06 23:23:13.470828 CST--
| Itration            | 352      |
| Real Det Return     | 876      |
| Real Sto Return     | 934      |
| Reward Loss         | -1.2e+03 |
| Running Env Steps   | 1760000  |
| Running Forward KL  | 40.7     |
| Running Reverse KL  | 14.9     |
| Running Update Time | 352      |
----------------------------------
--2023-11-06 23:25:21.066452 CST--
| Itration            | 353      |
| Real Det Return     | 1.98e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -874     |
| Running Env Steps   | 1765000  |
| Running Forward KL  | 31.7     |
| Running Reverse KL  | 7.6      |
| Running Update Time | 353      |
----------------------------------
--2023-11-06 23:27:28.843172 CST--
| Itration            | 354      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -856     |
| Running Env Steps   | 1770000  |
| Running Forward KL  | 31.2     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 354      |
----------------------------------
--2023-11-06 23:29:36.490757 CST--
| Itration            | 355      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -870     |
| Running Env Steps   | 1775000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 355      |
----------------------------------
--2023-11-06 23:31:43.953419 CST--
| Itration            | 356      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -849     |
| Running Env Steps   | 1780000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.49     |
| Running Update Time | 356      |
----------------------------------
--2023-11-06 23:33:51.194887 CST--
| Itration            | 357      |
| Real Det Return     | 2.18e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -851     |
| Running Env Steps   | 1785000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.58     |
| Running Update Time | 357      |
----------------------------------
--2023-11-06 23:35:58.647286 CST--
| Itration            | 358      |
| Real Det Return     | 2.16e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -837     |
| Running Env Steps   | 1790000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.5      |
| Running Update Time | 358      |
----------------------------------
--2023-11-06 23:38:05.949714 CST--
| Itration            | 359      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -882     |
| Running Env Steps   | 1795000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.62     |
| Running Update Time | 359      |
----------------------------------
--2023-11-06 23:40:09.308464 CST--
| Itration            | 360      |
| Real Det Return     | 2.37e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -877     |
| Running Env Steps   | 1800000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.53     |
| Running Update Time | 360      |
----------------------------------
--2023-11-06 23:42:15.067963 CST--
| Itration            | 361      |
| Real Det Return     | 2.29e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -874     |
| Running Env Steps   | 1805000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.42     |
| Running Update Time | 361      |
----------------------------------
--2023-11-06 23:44:20.552302 CST--
| Itration            | 362      |
| Real Det Return     | 2.15e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -866     |
| Running Env Steps   | 1810000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.66     |
| Running Update Time | 362      |
----------------------------------
--2023-11-06 23:46:25.681898 CST--
| Itration            | 363      |
| Real Det Return     | 2.21e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -859     |
| Running Env Steps   | 1815000  |
| Running Forward KL  | 30.8     |
| Running Reverse KL  | 7.54     |
| Running Update Time | 363      |
----------------------------------
--2023-11-06 23:48:30.717668 CST--
| Itration            | 364      |
| Real Det Return     | 2.22e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -861     |
| Running Env Steps   | 1820000  |
| Running Forward KL  | 30.9     |
| Running Reverse KL  | 7.61     |
| Running Update Time | 364      |
----------------------------------
--2023-11-06 23:50:26.864086 CST--
| Itration            | 365      |
| Real Det Return     | 2.25e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -868     |
| Running Env Steps   | 1825000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 7.46     |
| Running Update Time | 365      |
----------------------------------
--2023-11-06 23:52:32.457265 CST--
| Itration            | 366      |
| Real Det Return     | 2.09e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -891     |
| Running Env Steps   | 1830000  |
| Running Forward KL  | 31.2     |
| Running Reverse KL  | 7.82     |
| Running Update Time | 366      |
----------------------------------
--2023-11-06 23:54:37.784589 CST--
| Itration            | 367      |
| Real Det Return     | 2.15e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -849     |
| Running Env Steps   | 1835000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.55     |
| Running Update Time | 367      |
----------------------------------
--2023-11-06 23:56:43.283113 CST--
| Itration            | 368      |
| Real Det Return     | 2.47e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -892     |
| Running Env Steps   | 1840000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.6      |
| Running Update Time | 368      |
----------------------------------
--2023-11-06 23:58:48.053822 CST--
| Itration            | 369      |
| Real Det Return     | 2.54e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -877     |
| Running Env Steps   | 1845000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.5      |
| Running Update Time | 369      |
----------------------------------
--2023-11-07 00:00:51.999505 CST--
| Itration            | 370      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -891     |
| Running Env Steps   | 1850000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.72     |
| Running Update Time | 370      |
----------------------------------
--2023-11-07 00:02:55.988654 CST--
| Itration            | 371      |
| Real Det Return     | 2.1e+03  |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -871     |
| Running Env Steps   | 1855000  |
| Running Forward KL  | 30.6     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 371      |
----------------------------------
--2023-11-07 00:04:59.789466 CST--
| Itration            | 372      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -861     |
| Running Env Steps   | 1860000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.81     |
| Running Update Time | 372      |
----------------------------------
--2023-11-07 00:07:03.472403 CST--
| Itration            | 373      |
| Real Det Return     | 2.24e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -873     |
| Running Env Steps   | 1865000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.77     |
| Running Update Time | 373      |
----------------------------------
--2023-11-07 00:09:07.563753 CST--
| Itration            | 374      |
| Real Det Return     | 2.21e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -882     |
| Running Env Steps   | 1870000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 374      |
----------------------------------
--2023-11-07 00:11:08.743800 CST--
| Itration            | 375      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -869     |
| Running Env Steps   | 1875000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 375      |
----------------------------------
--2023-11-07 00:13:12.830208 CST--
| Itration            | 376      |
| Real Det Return     | 2.23e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -894     |
| Running Env Steps   | 1880000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.73     |
| Running Update Time | 376      |
----------------------------------
--2023-11-07 00:15:16.875315 CST--
| Itration            | 377      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -893     |
| Running Env Steps   | 1885000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.65     |
| Running Update Time | 377      |
----------------------------------
--2023-11-07 00:17:21.114903 CST--
| Itration            | 378      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 2.69e+03 |
| Reward Loss         | -889     |
| Running Env Steps   | 1890000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.72     |
| Running Update Time | 378      |
----------------------------------
--2023-11-07 00:19:24.973460 CST--
| Itration            | 379      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -878     |
| Running Env Steps   | 1895000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.69     |
| Running Update Time | 379      |
----------------------------------
--2023-11-07 00:21:28.750284 CST--
| Itration            | 380      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -899     |
| Running Env Steps   | 1900000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.72     |
| Running Update Time | 380      |
----------------------------------
--2023-11-07 00:23:32.438107 CST--
| Itration            | 381      |
| Real Det Return     | 2.14e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -887     |
| Running Env Steps   | 1905000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.86     |
| Running Update Time | 381      |
----------------------------------
--2023-11-07 00:25:36.172182 CST--
| Itration            | 382      |
| Real Det Return     | 2.33e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -898     |
| Running Env Steps   | 1910000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 382      |
----------------------------------
--2023-11-07 00:27:40.250907 CST--
| Itration            | 383      |
| Real Det Return     | 2.32e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -903     |
| Running Env Steps   | 1915000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.63     |
| Running Update Time | 383      |
----------------------------------
--2023-11-07 00:29:44.074847 CST--
| Itration            | 384      |
| Real Det Return     | 2.31e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -900     |
| Running Env Steps   | 1920000  |
| Running Forward KL  | 30.7     |
| Running Reverse KL  | 7.88     |
| Running Update Time | 384      |
----------------------------------
--2023-11-07 00:31:47.990164 CST--
| Itration            | 385      |
| Real Det Return     | 2.39e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -909     |
| Running Env Steps   | 1925000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.86     |
| Running Update Time | 385      |
----------------------------------
--2023-11-07 00:33:51.754833 CST--
| Itration            | 386      |
| Real Det Return     | 2.2e+03  |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -882     |
| Running Env Steps   | 1930000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.65     |
| Running Update Time | 386      |
----------------------------------
--2023-11-07 00:35:56.540566 CST--
| Itration            | 387      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -911     |
| Running Env Steps   | 1935000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 7.73     |
| Running Update Time | 387      |
----------------------------------
--2023-11-07 00:38:01.129778 CST--
| Itration            | 388      |
| Real Det Return     | 2.12e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -896     |
| Running Env Steps   | 1940000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 8.06     |
| Running Update Time | 388      |
----------------------------------
--2023-11-07 00:40:02.043445 CST--
| Itration            | 389      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -920     |
| Running Env Steps   | 1945000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.79     |
| Running Update Time | 389      |
----------------------------------
--2023-11-07 00:42:06.652393 CST--
| Itration            | 390      |
| Real Det Return     | 2.58e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -925     |
| Running Env Steps   | 1950000  |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 7.77     |
| Running Update Time | 390      |
----------------------------------
--2023-11-07 00:44:11.259955 CST--
| Itration            | 391      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -924     |
| Running Env Steps   | 1955000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.67     |
| Running Update Time | 391      |
----------------------------------
--2023-11-07 00:46:15.751982 CST--
| Itration            | 392      |
| Real Det Return     | 2.36e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -913     |
| Running Env Steps   | 1960000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.85     |
| Running Update Time | 392      |
----------------------------------
--2023-11-07 00:48:20.362398 CST--
| Itration            | 393      |
| Real Det Return     | 2.39e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -905     |
| Running Env Steps   | 1965000  |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 7.92     |
| Running Update Time | 393      |
----------------------------------
--2023-11-07 00:50:25.030543 CST--
| Itration            | 394      |
| Real Det Return     | 2.46e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -943     |
| Running Env Steps   | 1970000  |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 7.59     |
| Running Update Time | 394      |
----------------------------------
--2023-11-07 00:52:29.640307 CST--
| Itration            | 395      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -924     |
| Running Env Steps   | 1975000  |
| Running Forward KL  | 30.4     |
| Running Reverse KL  | 7.82     |
| Running Update Time | 395      |
----------------------------------
--2023-11-07 00:54:34.237408 CST--
| Itration            | 396      |
| Real Det Return     | 2.64e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -950     |
| Running Env Steps   | 1980000  |
| Running Forward KL  | 29       |
| Running Reverse KL  | 7.63     |
| Running Update Time | 396      |
----------------------------------
--2023-11-07 00:56:38.229781 CST--
| Itration            | 397      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -954     |
| Running Env Steps   | 1985000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.68     |
| Running Update Time | 397      |
----------------------------------
--2023-11-07 00:58:42.761904 CST--
| Itration            | 398      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -928     |
| Running Env Steps   | 1990000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.8      |
| Running Update Time | 398      |
----------------------------------
--2023-11-07 01:00:46.927636 CST--
| Itration            | 399      |
| Real Det Return     | 2.33e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -933     |
| Running Env Steps   | 1995000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 399      |
----------------------------------
--2023-11-07 01:02:50.679477 CST--
| Itration            | 400      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -947     |
| Running Env Steps   | 2000000  |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 400      |
----------------------------------
--2023-11-07 01:04:54.541573 CST--
| Itration            | 401      |
| Real Det Return     | 2.57e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -967     |
| Running Env Steps   | 2005000  |
| Running Forward KL  | 29.4     |
| Running Reverse KL  | 7.7      |
| Running Update Time | 401      |
----------------------------------
--2023-11-07 01:06:58.529529 CST--
| Itration            | 402      |
| Real Det Return     | 2.28e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -931     |
| Running Env Steps   | 2010000  |
| Running Forward KL  | 30.5     |
| Running Reverse KL  | 7.95     |
| Running Update Time | 402      |
----------------------------------
--2023-11-07 01:09:02.247564 CST--
| Itration            | 403      |
| Real Det Return     | 2.34e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -929     |
| Running Env Steps   | 2015000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.77     |
| Running Update Time | 403      |
----------------------------------
--2023-11-07 01:11:06.302663 CST--
| Itration            | 404      |
| Real Det Return     | 2.62e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -970     |
| Running Env Steps   | 2020000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.71     |
| Running Update Time | 404      |
----------------------------------
--2023-11-07 01:13:10.220370 CST--
| Itration            | 405      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -950     |
| Running Env Steps   | 2025000  |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 7.81     |
| Running Update Time | 405      |
----------------------------------
--2023-11-07 01:15:14.641180 CST--
| Itration            | 406      |
| Real Det Return     | 2.26e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -961     |
| Running Env Steps   | 2030000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.66     |
| Running Update Time | 406      |
----------------------------------
--2023-11-07 01:17:19.069097 CST--
| Itration            | 407      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.69e+03 |
| Reward Loss         | -966     |
| Running Env Steps   | 2035000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.93     |
| Running Update Time | 407      |
----------------------------------
--2023-11-07 01:19:23.639903 CST--
| Itration            | 408      |
| Real Det Return     | 2.27e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -977     |
| Running Env Steps   | 2040000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 7.81     |
| Running Update Time | 408      |
----------------------------------
--2023-11-07 01:21:27.679205 CST--
| Itration            | 409      |
| Real Det Return     | 2.54e+03 |
| Real Sto Return     | 2.62e+03 |
| Reward Loss         | -985     |
| Running Env Steps   | 2045000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.91     |
| Running Update Time | 409      |
----------------------------------
--2023-11-07 01:23:35.818232 CST--
| Itration            | 410      |
| Real Det Return     | 2.3e+03  |
| Real Sto Return     | 2.69e+03 |
| Reward Loss         | -940     |
| Running Env Steps   | 2050000  |
| Running Forward KL  | 29.6     |
| Running Reverse KL  | 7.85     |
| Running Update Time | 410      |
----------------------------------
--2023-11-07 01:25:41.015116 CST--
| Itration            | 411      |
| Real Det Return     | 2.49e+03 |
| Real Sto Return     | 2.68e+03 |
| Reward Loss         | -962     |
| Running Env Steps   | 2055000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 7.88     |
| Running Update Time | 411      |
----------------------------------
--2023-11-07 01:27:45.861185 CST--
| Itration            | 412      |
| Real Det Return     | 2.54e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -977     |
| Running Env Steps   | 2060000  |
| Running Forward KL  | 29.6     |
| Running Reverse KL  | 7.81     |
| Running Update Time | 412      |
----------------------------------
--2023-11-07 01:29:50.869107 CST--
| Itration            | 413      |
| Real Det Return     | 2.6e+03  |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -976     |
| Running Env Steps   | 2065000  |
| Running Forward KL  | 29.1     |
| Running Reverse KL  | 7.77     |
| Running Update Time | 413      |
----------------------------------
--2023-11-07 01:31:55.629892 CST--
| Itration            | 414      |
| Real Det Return     | 2.58e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -955     |
| Running Env Steps   | 2070000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 7.81     |
| Running Update Time | 414      |
----------------------------------
--2023-11-07 01:34:00.179822 CST---
| Itration            | 415       |
| Real Det Return     | 2.48e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.01e+03 |
| Running Env Steps   | 2075000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 7.95      |
| Running Update Time | 415       |
-----------------------------------
--2023-11-07 01:36:04.792449 CST--
| Itration            | 416      |
| Real Det Return     | 2.45e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -974     |
| Running Env Steps   | 2080000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.9      |
| Running Update Time | 416      |
----------------------------------
--2023-11-07 01:38:09.273459 CST--
| Itration            | 417      |
| Real Det Return     | 2.48e+03 |
| Real Sto Return     | 2.65e+03 |
| Reward Loss         | -1e+03   |
| Running Env Steps   | 2085000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 7.95     |
| Running Update Time | 417      |
----------------------------------
--2023-11-07 01:40:13.615000 CST--
| Itration            | 418      |
| Real Det Return     | 2.43e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -976     |
| Running Env Steps   | 2090000  |
| Running Forward KL  | 29.5     |
| Running Reverse KL  | 7.75     |
| Running Update Time | 418      |
----------------------------------
--2023-11-07 01:42:17.376623 CST--
| Itration            | 419      |
| Real Det Return     | 2.42e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -998     |
| Running Env Steps   | 2095000  |
| Running Forward KL  | 29.9     |
| Running Reverse KL  | 8.03     |
| Running Update Time | 419      |
----------------------------------
--2023-11-07 01:44:21.032255 CST--
| Itration            | 420      |
| Real Det Return     | 2.83e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -975     |
| Running Env Steps   | 2100000  |
| Running Forward KL  | 29.1     |
| Running Reverse KL  | 8.14     |
| Running Update Time | 420      |
----------------------------------
--2023-11-07 01:46:24.650399 CST---
| Itration            | 421       |
| Real Det Return     | 2.3e+03   |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.02e+03 |
| Running Env Steps   | 2105000   |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 7.91      |
| Running Update Time | 421       |
-----------------------------------
--2023-11-07 01:48:28.161604 CST--
| Itration            | 422      |
| Real Det Return     | 2.45e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -999     |
| Running Env Steps   | 2110000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 7.89     |
| Running Update Time | 422      |
----------------------------------
--2023-11-07 01:50:32.126227 CST--
| Itration            | 423      |
| Real Det Return     | 2.53e+03 |
| Real Sto Return     | 2.67e+03 |
| Reward Loss         | -991     |
| Running Env Steps   | 2115000  |
| Running Forward KL  | 30       |
| Running Reverse KL  | 8        |
| Running Update Time | 423      |
----------------------------------
--2023-11-07 01:52:36.103482 CST--
| Itration            | 424      |
| Real Det Return     | 2.42e+03 |
| Real Sto Return     | 2.66e+03 |
| Reward Loss         | -995     |
| Running Env Steps   | 2120000  |
| Running Forward KL  | 29.4     |
| Running Reverse KL  | 8        |
| Running Update Time | 424      |
----------------------------------
--2023-11-07 01:54:39.913491 CST--
| Itration            | 425      |
| Real Det Return     | 2.54e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -1e+03   |
| Running Env Steps   | 2125000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 8.33     |
| Running Update Time | 425      |
----------------------------------
--2023-11-07 01:56:43.715880 CST--
| Itration            | 426      |
| Real Det Return     | 2.61e+03 |
| Real Sto Return     | 2.69e+03 |
| Reward Loss         | -999     |
| Running Env Steps   | 2130000  |
| Running Forward KL  | 29.6     |
| Running Reverse KL  | 8.08     |
| Running Update Time | 426      |
----------------------------------
--2023-11-07 01:58:47.579873 CST--
| Itration            | 427      |
| Real Det Return     | 2.67e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -1e+03   |
| Running Env Steps   | 2135000  |
| Running Forward KL  | 29.7     |
| Running Reverse KL  | 8.24     |
| Running Update Time | 427      |
----------------------------------
--2023-11-07 02:00:51.011652 CST---
| Itration            | 428       |
| Real Det Return     | 2.79e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.03e+03 |
| Running Env Steps   | 2140000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.14      |
| Running Update Time | 428       |
-----------------------------------
--2023-11-07 02:02:54.192138 CST---
| Itration            | 429       |
| Real Det Return     | 2.48e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.04e+03 |
| Running Env Steps   | 2145000   |
| Running Forward KL  | 30.2      |
| Running Reverse KL  | 8.21      |
| Running Update Time | 429       |
-----------------------------------
--2023-11-07 02:04:57.181695 CST---
| Itration            | 430       |
| Real Det Return     | 2.76e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.03e+03 |
| Running Env Steps   | 2150000   |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 8.2       |
| Running Update Time | 430       |
-----------------------------------
--2023-11-07 02:07:00.269469 CST---
| Itration            | 431       |
| Real Det Return     | 2.37e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.02e+03 |
| Running Env Steps   | 2155000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.06      |
| Running Update Time | 431       |
-----------------------------------
--2023-11-07 02:09:03.957200 CST---
| Itration            | 432       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.05e+03 |
| Running Env Steps   | 2160000   |
| Running Forward KL  | 30.2      |
| Running Reverse KL  | 8.27      |
| Running Update Time | 432       |
-----------------------------------
--2023-11-07 02:11:07.444177 CST---
| Itration            | 433       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.54e+03  |
| Reward Loss         | -1.06e+03 |
| Running Env Steps   | 2165000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.4       |
| Running Update Time | 433       |
-----------------------------------
--2023-11-07 02:13:10.857940 CST---
| Itration            | 434       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.61e+03  |
| Reward Loss         | -1.05e+03 |
| Running Env Steps   | 2170000   |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 8.13      |
| Running Update Time | 434       |
-----------------------------------
--2023-11-07 02:15:14.107176 CST---
| Itration            | 435       |
| Real Det Return     | 2.64e+03  |
| Real Sto Return     | 2.62e+03  |
| Reward Loss         | -1.04e+03 |
| Running Env Steps   | 2175000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 8.18      |
| Running Update Time | 435       |
-----------------------------------
--2023-11-07 02:17:17.160316 CST---
| Itration            | 436       |
| Real Det Return     | 2.49e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.03e+03 |
| Running Env Steps   | 2180000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.32      |
| Running Update Time | 436       |
-----------------------------------
--2023-11-07 02:19:20.520867 CST---
| Itration            | 437       |
| Real Det Return     | 2.63e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2185000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.28      |
| Running Update Time | 437       |
-----------------------------------
--2023-11-07 02:21:23.768617 CST---
| Itration            | 438       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.05e+03 |
| Running Env Steps   | 2190000   |
| Running Forward KL  | 29.2      |
| Running Reverse KL  | 8.27      |
| Running Update Time | 438       |
-----------------------------------
--2023-11-07 02:23:27.195981 CST---
| Itration            | 439       |
| Real Det Return     | 2.48e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.06e+03 |
| Running Env Steps   | 2195000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.42      |
| Running Update Time | 439       |
-----------------------------------
--2023-11-07 02:25:30.567866 CST---
| Itration            | 440       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2200000   |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 8.36      |
| Running Update Time | 440       |
-----------------------------------
--2023-11-07 02:27:33.889979 CST---
| Itration            | 441       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.66e+03  |
| Reward Loss         | -1.06e+03 |
| Running Env Steps   | 2205000   |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 8.21      |
| Running Update Time | 441       |
-----------------------------------
--2023-11-07 02:29:38.840462 CST---
| Itration            | 442       |
| Real Det Return     | 2.56e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.05e+03 |
| Running Env Steps   | 2210000   |
| Running Forward KL  | 30        |
| Running Reverse KL  | 8.3       |
| Running Update Time | 442       |
-----------------------------------
--2023-11-07 02:31:43.432691 CST---
| Itration            | 443       |
| Real Det Return     | 2.72e+03  |
| Real Sto Return     | 2.66e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2215000   |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 8.4       |
| Running Update Time | 443       |
-----------------------------------
--2023-11-07 02:33:48.057019 CST---
| Itration            | 444       |
| Real Det Return     | 2.48e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2220000   |
| Running Forward KL  | 30.2      |
| Running Reverse KL  | 8.23      |
| Running Update Time | 444       |
-----------------------------------
--2023-11-07 02:35:52.533768 CST---
| Itration            | 445       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2225000   |
| Running Forward KL  | 29.5      |
| Running Reverse KL  | 8.4       |
| Running Update Time | 445       |
-----------------------------------
--2023-11-07 02:37:57.178412 CST--
| Itration            | 446      |
| Real Det Return     | 2.62e+03 |
| Real Sto Return     | 2.61e+03 |
| Reward Loss         | -1.1e+03 |
| Running Env Steps   | 2230000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 8.39     |
| Running Update Time | 446      |
----------------------------------
--2023-11-07 02:40:01.902351 CST---
| Itration            | 447       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.66e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2235000   |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 8.24      |
| Running Update Time | 447       |
-----------------------------------
--2023-11-07 02:42:06.255950 CST---
| Itration            | 448       |
| Real Det Return     | 2.63e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.07e+03 |
| Running Env Steps   | 2240000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.33      |
| Running Update Time | 448       |
-----------------------------------
--2023-11-07 02:44:11.095860 CST---
| Itration            | 449       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.11e+03 |
| Running Env Steps   | 2245000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.44      |
| Running Update Time | 449       |
-----------------------------------
--2023-11-07 02:46:15.681898 CST---
| Itration            | 450       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.13e+03 |
| Running Env Steps   | 2250000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.72      |
| Running Update Time | 450       |
-----------------------------------
--2023-11-07 02:48:20.290365 CST--
| Itration            | 451      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.63e+03 |
| Reward Loss         | -1.1e+03 |
| Running Env Steps   | 2255000  |
| Running Forward KL  | 29.8     |
| Running Reverse KL  | 8.54     |
| Running Update Time | 451      |
----------------------------------
--2023-11-07 02:50:24.866530 CST---
| Itration            | 452       |
| Real Det Return     | 2.69e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 2260000   |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 8.65      |
| Running Update Time | 452       |
-----------------------------------
--2023-11-07 02:52:27.562656 CST---
| Itration            | 453       |
| Real Det Return     | 2.64e+03  |
| Real Sto Return     | 2.64e+03  |
| Reward Loss         | -1.11e+03 |
| Running Env Steps   | 2265000   |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 8.47      |
| Running Update Time | 453       |
-----------------------------------
--2023-11-07 02:54:22.468950 CST---
| Itration            | 454       |
| Real Det Return     | 2.65e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.13e+03 |
| Running Env Steps   | 2270000   |
| Running Forward KL  | 29.4      |
| Running Reverse KL  | 8.44      |
| Running Update Time | 454       |
-----------------------------------
--2023-11-07 02:56:27.214196 CST---
| Itration            | 455       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.57e+03  |
| Reward Loss         | -1.13e+03 |
| Running Env Steps   | 2275000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.82      |
| Running Update Time | 455       |
-----------------------------------
--2023-11-07 02:58:31.859731 CST---
| Itration            | 456       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.11e+03 |
| Running Env Steps   | 2280000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 8.84      |
| Running Update Time | 456       |
-----------------------------------
--2023-11-07 03:00:36.654121 CST---
| Itration            | 457       |
| Real Det Return     | 2.51e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 2285000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 8.89      |
| Running Update Time | 457       |
-----------------------------------
--2023-11-07 03:02:41.213395 CST---
| Itration            | 458       |
| Real Det Return     | 2.69e+03  |
| Real Sto Return     | 2.61e+03  |
| Reward Loss         | -1.13e+03 |
| Running Env Steps   | 2290000   |
| Running Forward KL  | 29.3      |
| Running Reverse KL  | 8.91      |
| Running Update Time | 458       |
-----------------------------------
--2023-11-07 03:04:45.794233 CST---
| Itration            | 459       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.16e+03 |
| Running Env Steps   | 2295000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 8.95      |
| Running Update Time | 459       |
-----------------------------------
--2023-11-07 03:06:50.624003 CST---
| Itration            | 460       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 2300000   |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 8.79      |
| Running Update Time | 460       |
-----------------------------------
--2023-11-07 03:08:55.281635 CST---
| Itration            | 461       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.15e+03 |
| Running Env Steps   | 2305000   |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 9.31      |
| Running Update Time | 461       |
-----------------------------------
--2023-11-07 03:11:00.340868 CST---
| Itration            | 462       |
| Real Det Return     | 2.6e+03   |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.12e+03 |
| Running Env Steps   | 2310000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 8.72      |
| Running Update Time | 462       |
-----------------------------------
--2023-11-07 03:13:04.896081 CST---
| Itration            | 463       |
| Real Det Return     | 2.65e+03  |
| Real Sto Return     | 2.67e+03  |
| Reward Loss         | -1.16e+03 |
| Running Env Steps   | 2315000   |
| Running Forward KL  | 29.6      |
| Running Reverse KL  | 8.58      |
| Running Update Time | 463       |
-----------------------------------
--2023-11-07 03:15:09.856920 CST---
| Itration            | 464       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.64e+03  |
| Reward Loss         | -1.18e+03 |
| Running Env Steps   | 2320000   |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 8.97      |
| Running Update Time | 464       |
-----------------------------------
--2023-11-07 03:17:14.884608 CST---
| Itration            | 465       |
| Real Det Return     | 2.38e+03  |
| Real Sto Return     | 2.68e+03  |
| Reward Loss         | -1.15e+03 |
| Running Env Steps   | 2325000   |
| Running Forward KL  | 30.2      |
| Running Reverse KL  | 8.87      |
| Running Update Time | 465       |
-----------------------------------
--2023-11-07 03:19:19.788557 CST---
| Itration            | 466       |
| Real Det Return     | 2.76e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.18e+03 |
| Running Env Steps   | 2330000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 8.81      |
| Running Update Time | 466       |
-----------------------------------
--2023-11-07 03:21:24.802231 CST---
| Itration            | 467       |
| Real Det Return     | 2.69e+03  |
| Real Sto Return     | 2.66e+03  |
| Reward Loss         | -1.15e+03 |
| Running Env Steps   | 2335000   |
| Running Forward KL  | 30.3      |
| Running Reverse KL  | 9.22      |
| Running Update Time | 467       |
-----------------------------------
--2023-11-07 03:23:30.744352 CST--
| Itration            | 468      |
| Real Det Return     | 2.72e+03 |
| Real Sto Return     | 2.6e+03  |
| Reward Loss         | -1.2e+03 |
| Running Env Steps   | 2340000  |
| Running Forward KL  | 30.2     |
| Running Reverse KL  | 9.07     |
| Running Update Time | 468      |
----------------------------------
--2023-11-07 03:25:36.261303 CST---
| Itration            | 469       |
| Real Det Return     | 2.71e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.21e+03 |
| Running Env Steps   | 2345000   |
| Running Forward KL  | 30.3      |
| Running Reverse KL  | 9.18      |
| Running Update Time | 469       |
-----------------------------------
--2023-11-07 03:27:41.652702 CST---
| Itration            | 470       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.62e+03  |
| Reward Loss         | -1.18e+03 |
| Running Env Steps   | 2350000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 9.1       |
| Running Update Time | 470       |
-----------------------------------
--2023-11-07 03:29:46.738066 CST---
| Itration            | 471       |
| Real Det Return     | 2.72e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.18e+03 |
| Running Env Steps   | 2355000   |
| Running Forward KL  | 30.2      |
| Running Reverse KL  | 9.1       |
| Running Update Time | 471       |
-----------------------------------
--2023-11-07 03:31:51.726325 CST---
| Itration            | 472       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.55e+03  |
| Reward Loss         | -1.19e+03 |
| Running Env Steps   | 2360000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.49      |
| Running Update Time | 472       |
-----------------------------------
--2023-11-07 03:33:56.810902 CST---
| Itration            | 473       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.18e+03 |
| Running Env Steps   | 2365000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.04      |
| Running Update Time | 473       |
-----------------------------------
--2023-11-07 03:36:01.983789 CST--
| Itration            | 474      |
| Real Det Return     | 2.77e+03 |
| Real Sto Return     | 2.54e+03 |
| Reward Loss         | -1.2e+03 |
| Running Env Steps   | 2370000  |
| Running Forward KL  | 30.3     |
| Running Reverse KL  | 9.23     |
| Running Update Time | 474      |
----------------------------------
--2023-11-07 03:38:07.436276 CST---
| Itration            | 475       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.21e+03 |
| Running Env Steps   | 2375000   |
| Running Forward KL  | 30.8      |
| Running Reverse KL  | 9.35      |
| Running Update Time | 475       |
-----------------------------------
--2023-11-07 03:40:12.508136 CST--
| Itration            | 476      |
| Real Det Return     | 2.69e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -1.2e+03 |
| Running Env Steps   | 2380000  |
| Running Forward KL  | 30.1     |
| Running Reverse KL  | 9.21     |
| Running Update Time | 476      |
----------------------------------
--2023-11-07 03:42:17.985988 CST---
| Itration            | 477       |
| Real Det Return     | 2.67e+03  |
| Real Sto Return     | 2.61e+03  |
| Reward Loss         | -1.21e+03 |
| Running Env Steps   | 2385000   |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 9.09      |
| Running Update Time | 477       |
-----------------------------------
--2023-11-07 03:44:23.330281 CST---
| Itration            | 478       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.23e+03 |
| Running Env Steps   | 2390000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 9.44      |
| Running Update Time | 478       |
-----------------------------------
--2023-11-07 03:46:28.855292 CST---
| Itration            | 479       |
| Real Det Return     | 2.71e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.24e+03 |
| Running Env Steps   | 2395000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.41      |
| Running Update Time | 479       |
-----------------------------------
--2023-11-07 03:48:34.152014 CST---
| Itration            | 480       |
| Real Det Return     | 2.59e+03  |
| Real Sto Return     | 2.66e+03  |
| Reward Loss         | -1.23e+03 |
| Running Env Steps   | 2400000   |
| Running Forward KL  | 30.6      |
| Running Reverse KL  | 9.36      |
| Running Update Time | 480       |
-----------------------------------
--2023-11-07 03:50:39.613207 CST---
| Itration            | 481       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.22e+03 |
| Running Env Steps   | 2405000   |
| Running Forward KL  | 29.7      |
| Running Reverse KL  | 9.28      |
| Running Update Time | 481       |
-----------------------------------
--2023-11-07 03:52:44.815632 CST---
| Itration            | 482       |
| Real Det Return     | 2.63e+03  |
| Real Sto Return     | 2.64e+03  |
| Reward Loss         | -1.21e+03 |
| Running Env Steps   | 2410000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.5       |
| Running Update Time | 482       |
-----------------------------------
--2023-11-07 03:54:49.311262 CST---
| Itration            | 483       |
| Real Det Return     | 2.67e+03  |
| Real Sto Return     | 2.65e+03  |
| Reward Loss         | -1.21e+03 |
| Running Env Steps   | 2415000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.65      |
| Running Update Time | 483       |
-----------------------------------
--2023-11-07 03:56:53.555633 CST---
| Itration            | 484       |
| Real Det Return     | 2.7e+03   |
| Real Sto Return     | 2.61e+03  |
| Reward Loss         | -1.25e+03 |
| Running Env Steps   | 2420000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.6       |
| Running Update Time | 484       |
-----------------------------------
--2023-11-07 03:58:58.447792 CST---
| Itration            | 485       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.25e+03 |
| Running Env Steps   | 2425000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 9.48      |
| Running Update Time | 485       |
-----------------------------------
--2023-11-07 04:00:58.444214 CST---
| Itration            | 486       |
| Real Det Return     | 2.71e+03  |
| Real Sto Return     | 2.39e+03  |
| Reward Loss         | -1.28e+03 |
| Running Env Steps   | 2430000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 9.68      |
| Running Update Time | 486       |
-----------------------------------
--2023-11-07 04:03:02.812711 CST---
| Itration            | 487       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.27e+03 |
| Running Env Steps   | 2435000   |
| Running Forward KL  | 29.8      |
| Running Reverse KL  | 9.58      |
| Running Update Time | 487       |
-----------------------------------
--2023-11-07 04:05:07.518502 CST---
| Itration            | 488       |
| Real Det Return     | 2.79e+03  |
| Real Sto Return     | 2.57e+03  |
| Reward Loss         | -1.26e+03 |
| Running Env Steps   | 2440000   |
| Running Forward KL  | 30.4      |
| Running Reverse KL  | 9.65      |
| Running Update Time | 488       |
-----------------------------------
--2023-11-07 04:07:11.982364 CST---
| Itration            | 489       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.57e+03  |
| Reward Loss         | -1.28e+03 |
| Running Env Steps   | 2445000   |
| Running Forward KL  | 30.1      |
| Running Reverse KL  | 9.42      |
| Running Update Time | 489       |
-----------------------------------
--2023-11-07 04:09:16.161826 CST---
| Itration            | 490       |
| Real Det Return     | 2.76e+03  |
| Real Sto Return     | 2.48e+03  |
| Reward Loss         | -1.29e+03 |
| Running Env Steps   | 2450000   |
| Running Forward KL  | 29.9      |
| Running Reverse KL  | 9.43      |
| Running Update Time | 490       |
-----------------------------------
--2023-11-07 04:11:20.466874 CST---
| Itration            | 491       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.57e+03  |
| Reward Loss         | -1.29e+03 |
| Running Env Steps   | 2455000   |
| Running Forward KL  | 30.9      |
| Running Reverse KL  | 9.48      |
| Running Update Time | 491       |
-----------------------------------
--2023-11-07 04:13:24.710594 CST---
| Itration            | 492       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -1.31e+03 |
| Running Env Steps   | 2460000   |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 9.65      |
| Running Update Time | 492       |
-----------------------------------
--2023-11-07 04:15:29.137677 CST---
| Itration            | 493       |
| Real Det Return     | 2.8e+03   |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -1.32e+03 |
| Running Env Steps   | 2465000   |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 9.8       |
| Running Update Time | 493       |
-----------------------------------
--2023-11-07 04:17:33.490051 CST---
| Itration            | 494       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.46e+03  |
| Reward Loss         | -1.32e+03 |
| Running Env Steps   | 2470000   |
| Running Forward KL  | 30.5      |
| Running Reverse KL  | 9.84      |
| Running Update Time | 494       |
-----------------------------------
--2023-11-07 04:19:37.524492 CST---
| Itration            | 495       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.52e+03  |
| Reward Loss         | -1.31e+03 |
| Running Env Steps   | 2475000   |
| Running Forward KL  | 30.6      |
| Running Reverse KL  | 9.71      |
| Running Update Time | 495       |
-----------------------------------
--2023-11-07 04:21:49.753726 CST---
| Itration            | 496       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.33e+03 |
| Running Env Steps   | 2480000   |
| Running Forward KL  | 31.1      |
| Running Reverse KL  | 9.61      |
| Running Update Time | 496       |
-----------------------------------
--2023-11-07 04:24:01.857796 CST---
| Itration            | 497       |
| Real Det Return     | 2.71e+03  |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -1.33e+03 |
| Running Env Steps   | 2485000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.89      |
| Running Update Time | 497       |
-----------------------------------
--2023-11-07 04:26:14.540705 CST---
| Itration            | 498       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.34e+03 |
| Running Env Steps   | 2490000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.98      |
| Running Update Time | 498       |
-----------------------------------
--2023-11-07 04:28:26.382722 CST---
| Itration            | 499       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.63e+03  |
| Reward Loss         | -1.32e+03 |
| Running Env Steps   | 2495000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.69      |
| Running Update Time | 499       |
-----------------------------------
--2023-11-07 04:30:38.290410 CST---
| Itration            | 500       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.6e+03   |
| Reward Loss         | -1.35e+03 |
| Running Env Steps   | 2500000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 10.1      |
| Running Update Time | 500       |
-----------------------------------
--2023-11-07 04:32:50.399984 CST---
| Itration            | 501       |
| Real Det Return     | 2.78e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.35e+03 |
| Running Env Steps   | 2505000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 9.87      |
| Running Update Time | 501       |
-----------------------------------
--2023-11-07 04:35:02.543803 CST---
| Itration            | 502       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.57e+03  |
| Reward Loss         | -1.35e+03 |
| Running Env Steps   | 2510000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.66      |
| Running Update Time | 502       |
-----------------------------------
--2023-11-07 04:37:07.356334 CST---
| Itration            | 503       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.5e+03   |
| Reward Loss         | -1.35e+03 |
| Running Env Steps   | 2515000   |
| Running Forward KL  | 30.8      |
| Running Reverse KL  | 9.95      |
| Running Update Time | 503       |
-----------------------------------
--2023-11-07 04:39:12.229138 CST---
| Itration            | 504       |
| Real Det Return     | 2.79e+03  |
| Real Sto Return     | 2.58e+03  |
| Reward Loss         | -1.34e+03 |
| Running Env Steps   | 2520000   |
| Running Forward KL  | 30        |
| Running Reverse KL  | 9.6       |
| Running Update Time | 504       |
-----------------------------------
--2023-11-07 04:41:17.620490 CST---
| Itration            | 505       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.55e+03  |
| Reward Loss         | -1.36e+03 |
| Running Env Steps   | 2525000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 9.9       |
| Running Update Time | 505       |
-----------------------------------
--2023-11-07 04:43:22.855466 CST---
| Itration            | 506       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.39e+03 |
| Running Env Steps   | 2530000   |
| Running Forward KL  | 31.1      |
| Running Reverse KL  | 9.77      |
| Running Update Time | 506       |
-----------------------------------
--2023-11-07 04:45:27.587385 CST---
| Itration            | 507       |
| Real Det Return     | 2.79e+03  |
| Real Sto Return     | 2.54e+03  |
| Reward Loss         | -1.39e+03 |
| Running Env Steps   | 2535000   |
| Running Forward KL  | 30.8      |
| Running Reverse KL  | 9.92      |
| Running Update Time | 507       |
-----------------------------------
--2023-11-07 04:47:32.353469 CST---
| Itration            | 508       |
| Real Det Return     | 2.7e+03   |
| Real Sto Return     | 2.48e+03  |
| Reward Loss         | -1.37e+03 |
| Running Env Steps   | 2540000   |
| Running Forward KL  | 30.6      |
| Running Reverse KL  | 9.91      |
| Running Update Time | 508       |
-----------------------------------
--2023-11-07 04:49:37.293295 CST---
| Itration            | 509       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.62e+03  |
| Reward Loss         | -1.41e+03 |
| Running Env Steps   | 2545000   |
| Running Forward KL  | 31.2      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 509       |
-----------------------------------
--2023-11-07 04:51:41.983273 CST---
| Itration            | 510       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.43e+03 |
| Running Env Steps   | 2550000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 9.87      |
| Running Update Time | 510       |
-----------------------------------
--2023-11-07 04:53:46.757165 CST---
| Itration            | 511       |
| Real Det Return     | 2.69e+03  |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.43e+03 |
| Running Env Steps   | 2555000   |
| Running Forward KL  | 30.6      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 511       |
-----------------------------------
--2023-11-07 04:55:51.679678 CST---
| Itration            | 512       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -1.44e+03 |
| Running Env Steps   | 2560000   |
| Running Forward KL  | 30.9      |
| Running Reverse KL  | 9.9       |
| Running Update Time | 512       |
-----------------------------------
--2023-11-07 04:57:58.203550 CST---
| Itration            | 513       |
| Real Det Return     | 2.5e+03   |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.46e+03 |
| Running Env Steps   | 2565000   |
| Running Forward KL  | 31.4      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 513       |
-----------------------------------
--2023-11-07 05:00:03.513488 CST---
| Itration            | 514       |
| Real Det Return     | 2.62e+03  |
| Real Sto Return     | 2.48e+03  |
| Reward Loss         | -1.44e+03 |
| Running Env Steps   | 2570000   |
| Running Forward KL  | 30.9      |
| Running Reverse KL  | 10.2      |
| Running Update Time | 514       |
-----------------------------------
--2023-11-07 05:02:09.105298 CST---
| Itration            | 515       |
| Real Det Return     | 2.68e+03  |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.47e+03 |
| Running Env Steps   | 2575000   |
| Running Forward KL  | 31.1      |
| Running Reverse KL  | 10.3      |
| Running Update Time | 515       |
-----------------------------------
--2023-11-07 05:04:14.481386 CST---
| Itration            | 516       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.39e+03  |
| Reward Loss         | -1.48e+03 |
| Running Env Steps   | 2580000   |
| Running Forward KL  | 30.7      |
| Running Reverse KL  | 10.4      |
| Running Update Time | 516       |
-----------------------------------
--2023-11-07 05:06:19.800638 CST--
| Itration            | 517      |
| Real Det Return     | 2.64e+03 |
| Real Sto Return     | 2.44e+03 |
| Reward Loss         | -1.5e+03 |
| Running Env Steps   | 2585000  |
| Running Forward KL  | 31.4     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 517      |
----------------------------------
--2023-11-07 05:08:20.544062 CST---
| Itration            | 518       |
| Real Det Return     | 2.64e+03  |
| Real Sto Return     | 2.48e+03  |
| Reward Loss         | -1.47e+03 |
| Running Env Steps   | 2590000   |
| Running Forward KL  | 30.8      |
| Running Reverse KL  | 10.1      |
| Running Update Time | 518       |
-----------------------------------
--2023-11-07 05:10:25.760104 CST---
| Itration            | 519       |
| Real Det Return     | 2.7e+03   |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -1.47e+03 |
| Running Env Steps   | 2595000   |
| Running Forward KL  | 31.1      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 519       |
-----------------------------------
--2023-11-07 05:12:31.475802 CST---
| Itration            | 520       |
| Real Det Return     | 2.62e+03  |
| Real Sto Return     | 2.43e+03  |
| Reward Loss         | -1.48e+03 |
| Running Env Steps   | 2600000   |
| Running Forward KL  | 31.3      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 520       |
-----------------------------------
--2023-11-07 05:14:37.269934 CST--
| Itration            | 521      |
| Real Det Return     | 2.59e+03 |
| Real Sto Return     | 2.41e+03 |
| Reward Loss         | -1.5e+03 |
| Running Env Steps   | 2605000  |
| Running Forward KL  | 30.6     |
| Running Reverse KL  | 10.3     |
| Running Update Time | 521      |
----------------------------------
--2023-11-07 05:16:43.238177 CST--
| Itration            | 522      |
| Real Det Return     | 2.69e+03 |
| Real Sto Return     | 2.46e+03 |
| Reward Loss         | -1.5e+03 |
| Running Env Steps   | 2610000  |
| Running Forward KL  | 31.1     |
| Running Reverse KL  | 10.5     |
| Running Update Time | 522      |
----------------------------------
--2023-11-07 05:18:48.700726 CST---
| Itration            | 523       |
| Real Det Return     | 2.58e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.49e+03 |
| Running Env Steps   | 2615000   |
| Running Forward KL  | 30        |
| Running Reverse KL  | 10.5      |
| Running Update Time | 523       |
-----------------------------------
--2023-11-07 05:20:49.235599 CST--
| Itration            | 524      |
| Real Det Return     | 2.76e+03 |
| Real Sto Return     | 2.52e+03 |
| Reward Loss         | -1.5e+03 |
| Running Env Steps   | 2620000  |
| Running Forward KL  | 31.5     |
| Running Reverse KL  | 10.6     |
| Running Update Time | 524      |
----------------------------------
--2023-11-07 05:22:54.504191 CST---
| Itration            | 525       |
| Real Det Return     | 2.59e+03  |
| Real Sto Return     | 2.43e+03  |
| Reward Loss         | -1.51e+03 |
| Running Env Steps   | 2625000   |
| Running Forward KL  | 31        |
| Running Reverse KL  | 10.4      |
| Running Update Time | 525       |
-----------------------------------
--2023-11-07 05:24:59.915444 CST---
| Itration            | 526       |
| Real Det Return     | 2.68e+03  |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -1.53e+03 |
| Running Env Steps   | 2630000   |
| Running Forward KL  | 31.1      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 526       |
-----------------------------------
--2023-11-07 05:27:05.286619 CST---
| Itration            | 527       |
| Real Det Return     | 2.49e+03  |
| Real Sto Return     | 2.38e+03  |
| Reward Loss         | -1.54e+03 |
| Running Env Steps   | 2635000   |
| Running Forward KL  | 31.3      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 527       |
-----------------------------------
--2023-11-07 05:29:10.453313 CST---
| Itration            | 528       |
| Real Det Return     | 2.57e+03  |
| Real Sto Return     | 2.41e+03  |
| Reward Loss         | -1.55e+03 |
| Running Env Steps   | 2640000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 10.5      |
| Running Update Time | 528       |
-----------------------------------
--2023-11-07 05:31:15.757272 CST---
| Itration            | 529       |
| Real Det Return     | 2.76e+03  |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.58e+03 |
| Running Env Steps   | 2645000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 10.6      |
| Running Update Time | 529       |
-----------------------------------
--2023-11-07 05:33:21.264859 CST---
| Itration            | 530       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.5e+03   |
| Reward Loss         | -1.55e+03 |
| Running Env Steps   | 2650000   |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 10.7      |
| Running Update Time | 530       |
-----------------------------------
--2023-11-07 05:35:26.683077 CST---
| Itration            | 531       |
| Real Det Return     | 2.48e+03  |
| Real Sto Return     | 2.3e+03   |
| Reward Loss         | -1.59e+03 |
| Running Env Steps   | 2655000   |
| Running Forward KL  | 31.5      |
| Running Reverse KL  | 11        |
| Running Update Time | 531       |
-----------------------------------
--2023-11-07 05:37:31.668818 CST---
| Itration            | 532       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.59e+03  |
| Reward Loss         | -1.55e+03 |
| Running Env Steps   | 2660000   |
| Running Forward KL  | 31.5      |
| Running Reverse KL  | 10.8      |
| Running Update Time | 532       |
-----------------------------------
--2023-11-07 05:39:36.841382 CST---
| Itration            | 533       |
| Real Det Return     | 2.61e+03  |
| Real Sto Return     | 2.46e+03  |
| Reward Loss         | -1.58e+03 |
| Running Env Steps   | 2665000   |
| Running Forward KL  | 31.5      |
| Running Reverse KL  | 11        |
| Running Update Time | 533       |
-----------------------------------
--2023-11-07 05:41:43.787570 CST---
| Itration            | 534       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -1.56e+03 |
| Running Env Steps   | 2670000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 534       |
-----------------------------------
--2023-11-07 05:43:50.569666 CST---
| Itration            | 535       |
| Real Det Return     | 2.69e+03  |
| Real Sto Return     | 2.46e+03  |
| Reward Loss         | -1.58e+03 |
| Running Env Steps   | 2675000   |
| Running Forward KL  | 32        |
| Running Reverse KL  | 10.8      |
| Running Update Time | 535       |
-----------------------------------
--2023-11-07 05:45:57.180312 CST--
| Itration            | 536      |
| Real Det Return     | 2.68e+03 |
| Real Sto Return     | 2.45e+03 |
| Reward Loss         | -1.6e+03 |
| Running Env Steps   | 2680000  |
| Running Forward KL  | 31.9     |
| Running Reverse KL  | 11.3     |
| Running Update Time | 536      |
----------------------------------
--2023-11-07 05:48:03.361455 CST---
| Itration            | 537       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.53e+03  |
| Reward Loss         | -1.59e+03 |
| Running Env Steps   | 2685000   |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 537       |
-----------------------------------
--2023-11-07 05:50:10.158576 CST---
| Itration            | 538       |
| Real Det Return     | 2.61e+03  |
| Real Sto Return     | 2.46e+03  |
| Reward Loss         | -1.61e+03 |
| Running Env Steps   | 2690000   |
| Running Forward KL  | 31.6      |
| Running Reverse KL  | 11        |
| Running Update Time | 538       |
-----------------------------------
--2023-11-07 05:52:16.341110 CST---
| Itration            | 539       |
| Real Det Return     | 2.72e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.63e+03 |
| Running Env Steps   | 2695000   |
| Running Forward KL  | 31.2      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 539       |
-----------------------------------
--2023-11-07 05:54:20.130536 CST---
| Itration            | 540       |
| Real Det Return     | 2.7e+03   |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.62e+03 |
| Running Env Steps   | 2700000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 10.9      |
| Running Update Time | 540       |
-----------------------------------
--2023-11-07 05:56:17.504544 CST---
| Itration            | 541       |
| Real Det Return     | 2.68e+03  |
| Real Sto Return     | 2.45e+03  |
| Reward Loss         | -1.66e+03 |
| Running Env Steps   | 2705000   |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 541       |
-----------------------------------
--2023-11-07 05:58:21.188408 CST---
| Itration            | 542       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.43e+03  |
| Reward Loss         | -1.65e+03 |
| Running Env Steps   | 2710000   |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 542       |
-----------------------------------
--2023-11-07 06:00:25.030666 CST---
| Itration            | 543       |
| Real Det Return     | 2.73e+03  |
| Real Sto Return     | 2.48e+03  |
| Reward Loss         | -1.65e+03 |
| Running Env Steps   | 2715000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 543       |
-----------------------------------
--2023-11-07 06:02:29.007014 CST---
| Itration            | 544       |
| Real Det Return     | 2.68e+03  |
| Real Sto Return     | 2.47e+03  |
| Reward Loss         | -1.68e+03 |
| Running Env Steps   | 2720000   |
| Running Forward KL  | 30.8      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 544       |
-----------------------------------
--2023-11-07 06:04:32.903635 CST---
| Itration            | 545       |
| Real Det Return     | 2.68e+03  |
| Real Sto Return     | 2.46e+03  |
| Reward Loss         | -1.67e+03 |
| Running Env Steps   | 2725000   |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 545       |
-----------------------------------
--2023-11-07 06:06:36.492619 CST---
| Itration            | 546       |
| Real Det Return     | 2.77e+03  |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -1.67e+03 |
| Running Env Steps   | 2730000   |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 546       |
-----------------------------------
--2023-11-07 06:08:40.019440 CST---
| Itration            | 547       |
| Real Det Return     | 2.65e+03  |
| Real Sto Return     | 2.38e+03  |
| Reward Loss         | -1.71e+03 |
| Running Env Steps   | 2735000   |
| Running Forward KL  | 31.9      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 547       |
-----------------------------------
--2023-11-07 06:10:44.185465 CST---
| Itration            | 548       |
| Real Det Return     | 2.59e+03  |
| Real Sto Return     | 2.31e+03  |
| Reward Loss         | -1.71e+03 |
| Running Env Steps   | 2740000   |
| Running Forward KL  | 31.2      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 548       |
-----------------------------------
--2023-11-07 06:12:47.626759 CST---
| Itration            | 549       |
| Real Det Return     | 2.75e+03  |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -1.74e+03 |
| Running Env Steps   | 2745000   |
| Running Forward KL  | 32.7      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 549       |
-----------------------------------
--2023-11-07 06:14:51.048986 CST---
| Itration            | 550       |
| Real Det Return     | 2.64e+03  |
| Real Sto Return     | 2.43e+03  |
| Reward Loss         | -1.77e+03 |
| Running Env Steps   | 2750000   |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 550       |
-----------------------------------
--2023-11-07 06:16:54.360073 CST---
| Itration            | 551       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.39e+03  |
| Reward Loss         | -1.73e+03 |
| Running Env Steps   | 2755000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 551       |
-----------------------------------
--2023-11-07 06:18:57.720130 CST---
| Itration            | 552       |
| Real Det Return     | 2.79e+03  |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -1.73e+03 |
| Running Env Steps   | 2760000   |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 11.1      |
| Running Update Time | 552       |
-----------------------------------
--2023-11-07 06:21:01.004485 CST---
| Itration            | 553       |
| Real Det Return     | 2.61e+03  |
| Real Sto Return     | 2.37e+03  |
| Reward Loss         | -1.78e+03 |
| Running Env Steps   | 2765000   |
| Running Forward KL  | 32.1      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 553       |
-----------------------------------
--2023-11-07 06:23:04.192144 CST---
| Itration            | 554       |
| Real Det Return     | 2.7e+03   |
| Real Sto Return     | 2.38e+03  |
| Reward Loss         | -1.79e+03 |
| Running Env Steps   | 2770000   |
| Running Forward KL  | 32.7      |
| Running Reverse KL  | 11.3      |
| Running Update Time | 554       |
-----------------------------------
--2023-11-07 06:25:07.503041 CST--
| Itration            | 555      |
| Real Det Return     | 2.7e+03  |
| Real Sto Return     | 2.39e+03 |
| Reward Loss         | -1.8e+03 |
| Running Env Steps   | 2775000  |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 11.2     |
| Running Update Time | 555      |
----------------------------------
--2023-11-07 06:27:10.898709 CST---
| Itration            | 556       |
| Real Det Return     | 2.59e+03  |
| Real Sto Return     | 2.35e+03  |
| Reward Loss         | -1.78e+03 |
| Running Env Steps   | 2780000   |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 556       |
-----------------------------------
--2023-11-07 06:29:14.338717 CST---
| Itration            | 557       |
| Real Det Return     | 2.49e+03  |
| Real Sto Return     | 2.19e+03  |
| Reward Loss         | -1.87e+03 |
| Running Env Steps   | 2785000   |
| Running Forward KL  | 32.2      |
| Running Reverse KL  | 11.2      |
| Running Update Time | 557       |
-----------------------------------
--2023-11-07 06:31:27.632960 CST---
| Itration            | 558       |
| Real Det Return     | 2.66e+03  |
| Real Sto Return     | 2.38e+03  |
| Reward Loss         | -1.82e+03 |
| Running Env Steps   | 2790000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 558       |
-----------------------------------
--2023-11-07 06:33:40.453394 CST---
| Itration            | 559       |
| Real Det Return     | 2.67e+03  |
| Real Sto Return     | 2.35e+03  |
| Reward Loss         | -1.88e+03 |
| Running Env Steps   | 2795000   |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 559       |
-----------------------------------
--2023-11-07 06:35:53.219126 CST---
| Itration            | 560       |
| Real Det Return     | 2.58e+03  |
| Real Sto Return     | 2.33e+03  |
| Reward Loss         | -1.86e+03 |
| Running Env Steps   | 2800000   |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 560       |
-----------------------------------
--2023-11-07 06:38:05.990507 CST---
| Itration            | 561       |
| Real Det Return     | 2.71e+03  |
| Real Sto Return     | 2.37e+03  |
| Reward Loss         | -1.85e+03 |
| Running Env Steps   | 2805000   |
| Running Forward KL  | 32.3      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 561       |
-----------------------------------
--2023-11-07 06:40:18.887278 CST---
| Itration            | 562       |
| Real Det Return     | 2.58e+03  |
| Real Sto Return     | 2.37e+03  |
| Reward Loss         | -1.87e+03 |
| Running Env Steps   | 2810000   |
| Running Forward KL  | 32.4      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 562       |
-----------------------------------
--2023-11-07 06:42:31.780424 CST---
| Itration            | 563       |
| Real Det Return     | 2.54e+03  |
| Real Sto Return     | 2.21e+03  |
| Reward Loss         | -1.91e+03 |
| Running Env Steps   | 2815000   |
| Running Forward KL  | 32.6      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 563       |
-----------------------------------
--2023-11-07 06:44:44.776293 CST---
| Itration            | 564       |
| Real Det Return     | 2.53e+03  |
| Real Sto Return     | 2.18e+03  |
| Reward Loss         | -1.94e+03 |
| Running Env Steps   | 2820000   |
| Running Forward KL  | 33.2      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 564       |
-----------------------------------
--2023-11-07 06:46:57.777217 CST---
| Itration            | 565       |
| Real Det Return     | 2.29e+03  |
| Real Sto Return     | 2.21e+03  |
| Reward Loss         | -1.97e+03 |
| Running Env Steps   | 2825000   |
| Running Forward KL  | 33.4      |
| Running Reverse KL  | 11.9      |
| Running Update Time | 565       |
-----------------------------------
--2023-11-07 06:49:02.838752 CST--
| Itration            | 566      |
| Real Det Return     | 2.44e+03 |
| Real Sto Return     | 2.15e+03 |
| Reward Loss         | -2e+03   |
| Running Env Steps   | 2830000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 11.6     |
| Running Update Time | 566      |
----------------------------------
--2023-11-07 06:51:07.524175 CST---
| Itration            | 567       |
| Real Det Return     | 1.69e+03  |
| Real Sto Return     | 2e+03     |
| Reward Loss         | -2.07e+03 |
| Running Env Steps   | 2835000   |
| Running Forward KL  | 33.3      |
| Running Reverse KL  | 11.9      |
| Running Update Time | 567       |
-----------------------------------
--2023-11-07 06:53:12.677557 CST---
| Itration            | 568       |
| Real Det Return     | 1.7e+03   |
| Real Sto Return     | 2.06e+03  |
| Reward Loss         | -2.08e+03 |
| Running Env Steps   | 2840000   |
| Running Forward KL  | 33.2      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 568       |
-----------------------------------
--2023-11-07 06:55:17.911189 CST---
| Itration            | 569       |
| Real Det Return     | 1.71e+03  |
| Real Sto Return     | 2.07e+03  |
| Reward Loss         | -2.11e+03 |
| Running Env Steps   | 2845000   |
| Running Forward KL  | 33.1      |
| Running Reverse KL  | 11.4      |
| Running Update Time | 569       |
-----------------------------------
--2023-11-07 06:57:22.985342 CST---
| Itration            | 570       |
| Real Det Return     | 1.73e+03  |
| Real Sto Return     | 2.15e+03  |
| Reward Loss         | -2.11e+03 |
| Running Env Steps   | 2850000   |
| Running Forward KL  | 32.9      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 570       |
-----------------------------------
--2023-11-07 06:59:30.092460 CST---
| Itration            | 571       |
| Real Det Return     | 2.27e+03  |
| Real Sto Return     | 2.12e+03  |
| Reward Loss         | -2.11e+03 |
| Running Env Steps   | 2855000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 571       |
-----------------------------------
--2023-11-07 07:01:35.695440 CST---
| Itration            | 572       |
| Real Det Return     | 1.83e+03  |
| Real Sto Return     | 2.07e+03  |
| Reward Loss         | -2.16e+03 |
| Running Env Steps   | 2860000   |
| Running Forward KL  | 32.9      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 572       |
-----------------------------------
--2023-11-07 07:03:41.247958 CST---
| Itration            | 573       |
| Real Det Return     | 1.82e+03  |
| Real Sto Return     | 1.98e+03  |
| Reward Loss         | -2.16e+03 |
| Running Env Steps   | 2865000   |
| Running Forward KL  | 33.4      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 573       |
-----------------------------------
--2023-11-07 07:05:46.838204 CST--
| Itration            | 574      |
| Real Det Return     | 1.93e+03 |
| Real Sto Return     | 2.03e+03 |
| Reward Loss         | -2.2e+03 |
| Running Env Steps   | 2870000  |
| Running Forward KL  | 33.2     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 574      |
----------------------------------
--2023-11-07 07:07:52.633502 CST--
| Itration            | 575      |
| Real Det Return     | 1.97e+03 |
| Real Sto Return     | 2.12e+03 |
| Reward Loss         | -2.1e+03 |
| Running Env Steps   | 2875000  |
| Running Forward KL  | 32.7     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 575      |
----------------------------------
--2023-11-07 07:09:58.204295 CST---
| Itration            | 576       |
| Real Det Return     | 1.7e+03   |
| Real Sto Return     | 2.04e+03  |
| Reward Loss         | -2.19e+03 |
| Running Env Steps   | 2880000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 576       |
-----------------------------------
--2023-11-07 07:12:03.897384 CST---
| Itration            | 577       |
| Real Det Return     | 1.9e+03   |
| Real Sto Return     | 2.08e+03  |
| Reward Loss         | -2.17e+03 |
| Running Env Steps   | 2885000   |
| Running Forward KL  | 32.5      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 577       |
-----------------------------------
--2023-11-07 07:14:09.953698 CST---
| Itration            | 578       |
| Real Det Return     | 1.98e+03  |
| Real Sto Return     | 1.98e+03  |
| Reward Loss         | -2.29e+03 |
| Running Env Steps   | 2890000   |
| Running Forward KL  | 33.7      |
| Running Reverse KL  | 12.1      |
| Running Update Time | 578       |
-----------------------------------
--2023-11-07 07:16:15.613566 CST---
| Itration            | 579       |
| Real Det Return     | 1.88e+03  |
| Real Sto Return     | 2.03e+03  |
| Reward Loss         | -2.26e+03 |
| Running Env Steps   | 2895000   |
| Running Forward KL  | 33.5      |
| Running Reverse KL  | 11.8      |
| Running Update Time | 579       |
-----------------------------------
--2023-11-07 07:18:21.091181 CST---
| Itration            | 580       |
| Real Det Return     | 2.1e+03   |
| Real Sto Return     | 2.17e+03  |
| Reward Loss         | -2.23e+03 |
| Running Env Steps   | 2900000   |
| Running Forward KL  | 33.2      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 580       |
-----------------------------------
--2023-11-07 07:20:26.116824 CST---
| Itration            | 581       |
| Real Det Return     | 1.77e+03  |
| Real Sto Return     | 2.06e+03  |
| Reward Loss         | -2.27e+03 |
| Running Env Steps   | 2905000   |
| Running Forward KL  | 33.2      |
| Running Reverse KL  | 12        |
| Running Update Time | 581       |
-----------------------------------
--2023-11-07 07:22:31.067716 CST---
| Itration            | 582       |
| Real Det Return     | 1.8e+03   |
| Real Sto Return     | 2.05e+03  |
| Reward Loss         | -2.18e+03 |
| Running Env Steps   | 2910000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 582       |
-----------------------------------
--2023-11-07 07:24:36.117943 CST--
| Itration            | 583      |
| Real Det Return     | 1.9e+03  |
| Real Sto Return     | 2.1e+03  |
| Reward Loss         | -2.2e+03 |
| Running Env Steps   | 2915000  |
| Running Forward KL  | 32.6     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 583      |
----------------------------------
--2023-11-07 07:26:41.178995 CST---
| Itration            | 584       |
| Real Det Return     | 1.87e+03  |
| Real Sto Return     | 2.07e+03  |
| Reward Loss         | -2.24e+03 |
| Running Env Steps   | 2920000   |
| Running Forward KL  | 33.4      |
| Running Reverse KL  | 12        |
| Running Update Time | 584       |
-----------------------------------
--2023-11-07 07:28:46.160568 CST--
| Itration            | 585      |
| Real Det Return     | 1.89e+03 |
| Real Sto Return     | 2.12e+03 |
| Reward Loss         | -2.3e+03 |
| Running Env Steps   | 2925000  |
| Running Forward KL  | 33.1     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 585      |
----------------------------------
--2023-11-07 07:30:51.302505 CST---
| Itration            | 586       |
| Real Det Return     | 1.91e+03  |
| Real Sto Return     | 2.04e+03  |
| Reward Loss         | -2.32e+03 |
| Running Env Steps   | 2930000   |
| Running Forward KL  | 33.4      |
| Running Reverse KL  | 12        |
| Running Update Time | 586       |
-----------------------------------
--2023-11-07 07:32:45.998010 CST---
| Itration            | 587       |
| Real Det Return     | 2.13e+03  |
| Real Sto Return     | 2.12e+03  |
| Reward Loss         | -2.27e+03 |
| Running Env Steps   | 2935000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 587       |
-----------------------------------
--2023-11-07 07:34:51.022402 CST---
| Itration            | 588       |
| Real Det Return     | 2.07e+03  |
| Real Sto Return     | 2.23e+03  |
| Reward Loss         | -2.18e+03 |
| Running Env Steps   | 2940000   |
| Running Forward KL  | 32.2      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 588       |
-----------------------------------
--2023-11-07 07:36:56.019138 CST--
| Itration            | 589      |
| Real Det Return     | 2.05e+03 |
| Real Sto Return     | 2.11e+03 |
| Reward Loss         | -2.3e+03 |
| Running Env Steps   | 2945000  |
| Running Forward KL  | 32.2     |
| Running Reverse KL  | 11.5     |
| Running Update Time | 589      |
----------------------------------
--2023-11-07 07:39:01.015263 CST---
| Itration            | 590       |
| Real Det Return     | 2.09e+03  |
| Real Sto Return     | 2.06e+03  |
| Reward Loss         | -2.34e+03 |
| Running Env Steps   | 2950000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.9      |
| Running Update Time | 590       |
-----------------------------------
--2023-11-07 07:41:05.903339 CST---
| Itration            | 591       |
| Real Det Return     | 2.58e+03  |
| Real Sto Return     | 2.51e+03  |
| Reward Loss         | -2.02e+03 |
| Running Env Steps   | 2955000   |
| Running Forward KL  | 31.8      |
| Running Reverse KL  | 11.7      |
| Running Update Time | 591       |
-----------------------------------
--2023-11-07 07:43:10.974935 CST--
| Itration            | 592      |
| Real Det Return     | 2.15e+03 |
| Real Sto Return     | 2.48e+03 |
| Reward Loss         | -2.1e+03 |
| Running Env Steps   | 2960000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 11.4     |
| Running Update Time | 592      |
----------------------------------
--2023-11-07 07:45:16.055583 CST--
| Itration            | 593      |
| Real Det Return     | 2.11e+03 |
| Real Sto Return     | 2.33e+03 |
| Reward Loss         | -2.2e+03 |
| Running Env Steps   | 2965000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 11.7     |
| Running Update Time | 593      |
----------------------------------
--2023-11-07 07:47:21.179669 CST---
| Itration            | 594       |
| Real Det Return     | 2.18e+03  |
| Real Sto Return     | 2.49e+03  |
| Reward Loss         | -2.09e+03 |
| Running Env Steps   | 2970000   |
| Running Forward KL  | 32.6      |
| Running Reverse KL  | 11.6      |
| Running Update Time | 594       |
-----------------------------------
--2023-11-07 07:49:26.330552 CST---
| Itration            | 595       |
| Real Det Return     | 2.58e+03  |
| Real Sto Return     | 2.53e+03  |
| Reward Loss         | -2.08e+03 |
| Running Env Steps   | 2975000   |
| Running Forward KL  | 32.6      |
| Running Reverse KL  | 11.9      |
| Running Update Time | 595       |
-----------------------------------
--2023-11-07 07:51:35.607176 CST---
| Itration            | 596       |
| Real Det Return     | 2.16e+03  |
| Real Sto Return     | 2.29e+03  |
| Reward Loss         | -2.31e+03 |
| Running Env Steps   | 2980000   |
| Running Forward KL  | 32.8      |
| Running Reverse KL  | 11.5      |
| Running Update Time | 596       |
-----------------------------------
--2023-11-07 07:53:44.832283 CST--
| Itration            | 597      |
| Real Det Return     | 2.68e+03 |
| Real Sto Return     | 2.64e+03 |
| Reward Loss         | -2e+03   |
| Running Env Steps   | 2985000  |
| Running Forward KL  | 32.7     |
| Running Reverse KL  | 12.2     |
| Running Update Time | 597      |
----------------------------------
--2023-11-07 07:55:54.307825 CST--
| Itration            | 598      |
| Real Det Return     | 2.68e+03 |
| Real Sto Return     | 2.59e+03 |
| Reward Loss         | -2.1e+03 |
| Running Env Steps   | 2990000  |
| Running Forward KL  | 32.3     |
| Running Reverse KL  | 11.8     |
| Running Update Time | 598      |
----------------------------------
--2023-11-07 07:58:03.631714 CST---
| Itration            | 599       |
| Real Det Return     | 2.74e+03  |
| Real Sto Return     | 2.53e+03  |
| Reward Loss         | -2.13e+03 |
| Running Env Steps   | 2995000   |
| Running Forward KL  | 32.5      |
| Running Reverse KL  | 12.2      |
| Running Update Time | 599       |
-----------------------------------
