[{"env_step": 0, "rew": 130.0823, "rew_std": 15.1427, "Agent": "PPO"}, {"env_step": 30720, "rew": 350.9917, "rew_std": 24.4802, "Agent": "PPO"}, {"env_step": 61440, "rew": 425.4232, "rew_std": 23.1423, "Agent": "PPO"}, {"env_step": 92160, "rew": 465.9451, "rew_std": 49.5543, "Agent": "PPO"}, {"env_step": 122880, "rew": 493.9147, "rew_std": 26.3191, "Agent": "PPO"}, {"env_step": 153600, "rew": 490.4975, "rew_std": 42.5076, "Agent": "PPO"}, {"env_step": 184320, "rew": 501.0533, "rew_std": 44.1211, "Agent": "PPO"}, {"env_step": 215040, "rew": 511.8286, "rew_std": 45.6841, "Agent": "PPO"}, {"env_step": 245760, "rew": 510.9731, "rew_std": 39.5026, "Agent": "PPO"}, {"env_step": 276480, "rew": 521.749, "rew_std": 45.4886, "Agent": "PPO"}, {"env_step": 307200, "rew": 541.7495, "rew_std": 33.5348, "Agent": "PPO"}, {"env_step": 337920, "rew": 551.0738, "rew_std": 41.6129, "Agent": "PPO"}, {"env_step": 368640, "rew": 558.4841, "rew_std": 42.2806, "Agent": "PPO"}, {"env_step": 399360, "rew": 559.4836, "rew_std": 61.2039, "Agent": "PPO"}, {"env_step": 430080, "rew": 567.995, "rew_std": 38.5396, "Agent": "PPO"}, {"env_step": 460800, "rew": 550.0916, "rew_std": 39.8131, "Agent": "PPO"}, {"env_step": 491520, "rew": 582.7719, "rew_std": 64.735, "Agent": "PPO"}, {"env_step": 522240, "rew": 579.7875, "rew_std": 48.9013, "Agent": "PPO"}, {"env_step": 552960, "rew": 606.7364, "rew_std": 78.9236, "Agent": "PPO"}, {"env_step": 583680, "rew": 609.9051, "rew_std": 50.6975, "Agent": "PPO"}, {"env_step": 614400, "rew": 631.2371, "rew_std": 77.1233, "Agent": "PPO"}, {"env_step": 645120, "rew": 648.6753, "rew_std": 92.364, "Agent": "PPO"}, {"env_step": 675840, "rew": 634.2489, "rew_std": 73.4048, "Agent": "PPO"}, {"env_step": 706560, "rew": 628.1442, "rew_std": 72.5634, "Agent": "PPO"}, {"env_step": 737280, "rew": 663.1003, "rew_std": 80.5057, "Agent": "PPO"}, {"env_step": 768000, "rew": 676.9848, "rew_std": 73.3874, "Agent": "PPO"}, {"env_step": 798720, "rew": 656.3851, "rew_std": 78.3265, "Agent": "PPO"}, {"env_step": 829440, "rew": 712.8563, "rew_std": 67.9891, "Agent": "PPO"}, {"env_step": 860160, "rew": 701.9783, "rew_std": 119.4269, "Agent": "PPO"}, {"env_step": 890880, "rew": 727.9524, "rew_std": 98.1045, "Agent": "PPO"}, {"env_step": 921600, "rew": 716.8859, "rew_std": 90.7377, "Agent": "PPO"}, {"env_step": 952320, "rew": 739.1209, "rew_std": 132.9358, "Agent": "PPO"}, {"env_step": 983040, "rew": 787.0681, "rew_std": 193.5017, "Agent": "PPO"}, {"env_step": 1013760, "rew": 732.3068, "rew_std": 105.6359, "Agent": "PPO"}, {"env_step": 1044480, "rew": 747.3812, "rew_std": 144.6905, "Agent": "PPO"}, {"env_step": 1075200, "rew": 753.0065, "rew_std": 150.7269, "Agent": "PPO"}, {"env_step": 1105920, "rew": 767.1866, "rew_std": 177.7926, "Agent": "PPO"}, {"env_step": 1136640, "rew": 745.1658, "rew_std": 115.0446, "Agent": "PPO"}, {"env_step": 1167360, "rew": 775.4483, "rew_std": 129.888, "Agent": "PPO"}, {"env_step": 1198080, "rew": 784.5837, "rew_std": 148.4, "Agent": "PPO"}, {"env_step": 1228800, "rew": 825.0454, "rew_std": 157.0856, "Agent": "PPO"}, {"env_step": 1259520, "rew": 829.8744, "rew_std": 171.9486, "Agent": "PPO"}, {"env_step": 1290240, "rew": 826.0339, "rew_std": 164.3613, "Agent": "PPO"}, {"env_step": 1320960, "rew": 804.6047, "rew_std": 151.2456, "Agent": "PPO"}, {"env_step": 1351680, "rew": 815.0404, "rew_std": 188.6186, "Agent": "PPO"}, {"env_step": 1382400, "rew": 835.5702, "rew_std": 150.8863, "Agent": "PPO"}, {"env_step": 1413120, "rew": 842.724, "rew_std": 188.133, "Agent": "PPO"}, {"env_step": 1443840, "rew": 860.3203, "rew_std": 198.2533, "Agent": "PPO"}, {"env_step": 1474560, "rew": 841.7917, "rew_std": 155.3849, "Agent": "PPO"}, {"env_step": 1505280, "rew": 800.4889, "rew_std": 148.3306, "Agent": "PPO"}, {"env_step": 1536000, "rew": 935.7042, "rew_std": 249.8531, "Agent": "PPO"}, {"env_step": 1566720, "rew": 888.7137, "rew_std": 174.3786, "Agent": "PPO"}, {"env_step": 1597440, "rew": 832.1629, "rew_std": 155.7721, "Agent": "PPO"}, {"env_step": 1628160, "rew": 986.3306, "rew_std": 285.295, "Agent": "PPO"}, {"env_step": 1658880, "rew": 853.313, "rew_std": 158.3305, "Agent": "PPO"}, {"env_step": 1689600, "rew": 877.4147, "rew_std": 171.3564, "Agent": "PPO"}, {"env_step": 1720320, "rew": 925.5333, "rew_std": 274.6513, "Agent": "PPO"}, {"env_step": 1751040, "rew": 920.2305, "rew_std": 239.9945, "Agent": "PPO"}, {"env_step": 1781760, "rew": 927.6438, "rew_std": 268.7642, "Agent": "PPO"}, {"env_step": 1812480, "rew": 965.5925, "rew_std": 252.3835, "Agent": "PPO"}, {"env_step": 1843200, "rew": 977.3575, "rew_std": 338.2636, "Agent": "PPO"}, {"env_step": 1873920, "rew": 1062.624, "rew_std": 421.2998, "Agent": "PPO"}, {"env_step": 1904640, "rew": 1017.8632, "rew_std": 357.3262, "Agent": "PPO"}, {"env_step": 1935360, "rew": 1045.3381, "rew_std": 363.1296, "Agent": "PPO"}, {"env_step": 1966080, "rew": 988.6769, "rew_std": 293.54, "Agent": "PPO"}, {"env_step": 1996800, "rew": 1039.9539, "rew_std": 317.9886, "Agent": "PPO"}, {"env_step": 2027520, "rew": 1000.3818, "rew_std": 267.0232, "Agent": "PPO"}, {"env_step": 2058240, "rew": 932.8863, "rew_std": 172.0988, "Agent": "PPO"}, {"env_step": 2088960, "rew": 1063.8193, "rew_std": 356.9004, "Agent": "PPO"}, {"env_step": 2119680, "rew": 1007.1344, "rew_std": 293.2305, "Agent": "PPO"}, {"env_step": 2150400, "rew": 1118.3303, "rew_std": 434.818, "Agent": "PPO"}, {"env_step": 2181120, "rew": 1040.4434, "rew_std": 270.6467, "Agent": "PPO"}, {"env_step": 2211840, "rew": 1104.2401, "rew_std": 395.4114, "Agent": "PPO"}, {"env_step": 2242560, "rew": 1083.2706, "rew_std": 306.5721, "Agent": "PPO"}, {"env_step": 2273280, "rew": 1027.5872, "rew_std": 275.1138, "Agent": "PPO"}, {"env_step": 2304000, "rew": 1177.9164, "rew_std": 353.1948, "Agent": "PPO"}, {"env_step": 2334720, "rew": 1087.1684, "rew_std": 305.1818, "Agent": "PPO"}, {"env_step": 2365440, "rew": 1177.7415, "rew_std": 304.9442, "Agent": "PPO"}, {"env_step": 2396160, "rew": 1058.5766, "rew_std": 268.4139, "Agent": "PPO"}, {"env_step": 2426880, "rew": 1219.0824, "rew_std": 504.7934, "Agent": "PPO"}, {"env_step": 2457600, "rew": 1138.8759, "rew_std": 339.5198, "Agent": "PPO"}, {"env_step": 2488320, "rew": 1154.2304, "rew_std": 377.9643, "Agent": "PPO"}, {"env_step": 2519040, "rew": 1290.3548, "rew_std": 410.5781, "Agent": "PPO"}, {"env_step": 2549760, "rew": 1251.92, "rew_std": 435.415, "Agent": "PPO"}, {"env_step": 2580480, "rew": 1235.0206, "rew_std": 365.7419, "Agent": "PPO"}, {"env_step": 2611200, "rew": 1273.9936, "rew_std": 443.1518, "Agent": "PPO"}, {"env_step": 2641920, "rew": 1222.3642, "rew_std": 409.0311, "Agent": "PPO"}, {"env_step": 2672640, "rew": 1348.982, "rew_std": 560.3245, "Agent": "PPO"}, {"env_step": 2703360, "rew": 1274.8993, "rew_std": 312.1054, "Agent": "PPO"}, {"env_step": 2734080, "rew": 1359.7101, "rew_std": 572.6597, "Agent": "PPO"}, {"env_step": 2764800, "rew": 1323.7258, "rew_std": 509.658, "Agent": "PPO"}, {"env_step": 2795520, "rew": 1181.5144, "rew_std": 341.507, "Agent": "PPO"}, {"env_step": 2826240, "rew": 1279.5406, "rew_std": 448.5542, "Agent": "PPO"}, {"env_step": 2856960, "rew": 1291.4052, "rew_std": 369.7179, "Agent": "PPO"}, {"env_step": 2887680, "rew": 1144.7832, "rew_std": 223.4122, "Agent": "PPO"}, {"env_step": 2918400, "rew": 1323.9516, "rew_std": 476.6721, "Agent": "PPO"}, {"env_step": 2949120, "rew": 1208.2497, "rew_std": 322.735, "Agent": "PPO"}, {"env_step": 2979840, "rew": 1346.5563, "rew_std": 454.0205, "Agent": "PPO"}, {"env_step": 3010560, "rew": 1418.4356, "rew_std": 586.806, "Agent": "PPO"}, {"env_step": 3041280, "rew": 1401.6184, "rew_std": 675.0394, "Agent": "PPO"}, {"env_step": 3072000, "rew": 1225.8906, "rew_std": 338.3397, "Agent": "PPO"}, {"env_step": 5000, "rew": 235.9497, "rew_std": 126.1434, "Agent": "TD3"}, {"env_step": 10000, "rew": 164.07, "rew_std": 81.7212, "Agent": "TD3"}, {"env_step": 15000, "rew": 211.2634, "rew_std": 79.2344, "Agent": "TD3"}, {"env_step": 20000, "rew": 282.4783, "rew_std": 93.0359, "Agent": "TD3"}, {"env_step": 25000, "rew": 318.5609, "rew_std": 73.6385, "Agent": "TD3"}, {"env_step": 30000, "rew": 291.8901, "rew_std": 40.7493, "Agent": "TD3"}, {"env_step": 35000, "rew": 313.7815, "rew_std": 73.0841, "Agent": "TD3"}, {"env_step": 40000, "rew": 337.9159, "rew_std": 57.573, "Agent": "TD3"}, {"env_step": 45000, "rew": 368.3768, "rew_std": 92.3044, "Agent": "TD3"}, {"env_step": 50000, "rew": 344.416, "rew_std": 76.0211, "Agent": "TD3"}, {"env_step": 55000, "rew": 429.7109, "rew_std": 82.0808, "Agent": "TD3"}, {"env_step": 60000, "rew": 395.007, "rew_std": 63.4624, "Agent": "TD3"}, {"env_step": 65000, "rew": 415.4698, "rew_std": 62.3147, "Agent": "TD3"}, {"env_step": 70000, "rew": 459.2035, "rew_std": 48.2942, "Agent": "TD3"}, {"env_step": 75000, "rew": 452.3541, "rew_std": 65.0611, "Agent": "TD3"}, {"env_step": 80000, "rew": 461.8969, "rew_std": 63.6509, "Agent": "TD3"}, {"env_step": 85000, "rew": 476.0453, "rew_std": 71.275, "Agent": "TD3"}, {"env_step": 90000, "rew": 500.811, "rew_std": 84.8932, "Agent": "TD3"}, {"env_step": 95000, "rew": 485.3997, "rew_std": 80.3051, "Agent": "TD3"}, {"env_step": 100000, "rew": 503.4416, "rew_std": 42.9756, "Agent": "TD3"}, {"env_step": 105000, "rew": 527.5804, "rew_std": 77.3744, "Agent": "TD3"}, {"env_step": 110000, "rew": 544.3686, "rew_std": 55.0087, "Agent": "TD3"}, {"env_step": 115000, "rew": 553.5231, "rew_std": 50.6329, "Agent": "TD3"}, {"env_step": 120000, "rew": 574.4474, "rew_std": 75.047, "Agent": "TD3"}, {"env_step": 125000, "rew": 559.3873, "rew_std": 86.2582, "Agent": "TD3"}, {"env_step": 130000, "rew": 570.9049, "rew_std": 59.5154, "Agent": "TD3"}, {"env_step": 135000, "rew": 580.3405, "rew_std": 50.9925, "Agent": "TD3"}, {"env_step": 140000, "rew": 606.0723, "rew_std": 62.0672, "Agent": "TD3"}, {"env_step": 145000, "rew": 605.5913, "rew_std": 31.7131, "Agent": "TD3"}, {"env_step": 150000, "rew": 625.5167, "rew_std": 66.0565, "Agent": "TD3"}, {"env_step": 155000, "rew": 652.0839, "rew_std": 133.1029, "Agent": "TD3"}, {"env_step": 160000, "rew": 677.93, "rew_std": 73.4751, "Agent": "TD3"}, {"env_step": 165000, "rew": 660.96, "rew_std": 107.0351, "Agent": "TD3"}, {"env_step": 170000, "rew": 667.0291, "rew_std": 57.4566, "Agent": "TD3"}, {"env_step": 175000, "rew": 699.7508, "rew_std": 86.6757, "Agent": "TD3"}, {"env_step": 180000, "rew": 724.8383, "rew_std": 124.4392, "Agent": "TD3"}, {"env_step": 185000, "rew": 792.9929, "rew_std": 102.3493, "Agent": "TD3"}, {"env_step": 190000, "rew": 801.6827, "rew_std": 176.7923, "Agent": "TD3"}, {"env_step": 195000, "rew": 860.7451, "rew_std": 123.1047, "Agent": "TD3"}, {"env_step": 200000, "rew": 831.1765, "rew_std": 115.7513, "Agent": "TD3"}, {"env_step": 205000, "rew": 891.3844, "rew_std": 153.8025, "Agent": "TD3"}, {"env_step": 210000, "rew": 920.1051, "rew_std": 138.4675, "Agent": "TD3"}, {"env_step": 215000, "rew": 968.2489, "rew_std": 206.803, "Agent": "TD3"}, {"env_step": 220000, "rew": 987.881, "rew_std": 128.4658, "Agent": "TD3"}, {"env_step": 225000, "rew": 1061.9422, "rew_std": 223.8467, "Agent": "TD3"}, {"env_step": 230000, "rew": 1259.2323, "rew_std": 497.5445, "Agent": "TD3"}, {"env_step": 235000, "rew": 1096.4967, "rew_std": 141.7399, "Agent": "TD3"}, {"env_step": 240000, "rew": 1311.5082, "rew_std": 429.5385, "Agent": "TD3"}, {"env_step": 245000, "rew": 1311.3561, "rew_std": 450.7312, "Agent": "TD3"}, {"env_step": 250000, "rew": 1557.6187, "rew_std": 1001.0859, "Agent": "TD3"}, {"env_step": 255000, "rew": 1492.0918, "rew_std": 536.5407, "Agent": "TD3"}, {"env_step": 260000, "rew": 1478.4514, "rew_std": 597.8008, "Agent": "TD3"}, {"env_step": 265000, "rew": 1759.7188, "rew_std": 679.3698, "Agent": "TD3"}, {"env_step": 270000, "rew": 1536.9493, "rew_std": 357.449, "Agent": "TD3"}, {"env_step": 275000, "rew": 1667.6531, "rew_std": 376.0051, "Agent": "TD3"}, {"env_step": 280000, "rew": 1751.9256, "rew_std": 554.9098, "Agent": "TD3"}, {"env_step": 285000, "rew": 2053.3891, "rew_std": 597.2069, "Agent": "TD3"}, {"env_step": 290000, "rew": 2180.2304, "rew_std": 747.0793, "Agent": "TD3"}, {"env_step": 295000, "rew": 2150.2635, "rew_std": 542.9699, "Agent": "TD3"}, {"env_step": 300000, "rew": 2311.3341, "rew_std": 776.4552, "Agent": "TD3"}, {"env_step": 305000, "rew": 2605.4033, "rew_std": 969.016, "Agent": "TD3"}, {"env_step": 310000, "rew": 2496.6585, "rew_std": 490.1734, "Agent": "TD3"}, {"env_step": 315000, "rew": 2636.3198, "rew_std": 815.1771, "Agent": "TD3"}, {"env_step": 320000, "rew": 2553.8276, "rew_std": 1048.6062, "Agent": "TD3"}, {"env_step": 325000, "rew": 2962.0407, "rew_std": 1075.7931, "Agent": "TD3"}, {"env_step": 330000, "rew": 2935.3863, "rew_std": 1000.7385, "Agent": "TD3"}, {"env_step": 335000, "rew": 2921.3217, "rew_std": 774.101, "Agent": "TD3"}, {"env_step": 340000, "rew": 3469.4737, "rew_std": 1022.4847, "Agent": "TD3"}, {"env_step": 345000, "rew": 3185.8696, "rew_std": 733.3435, "Agent": "TD3"}, {"env_step": 350000, "rew": 3575.7222, "rew_std": 921.7069, "Agent": "TD3"}, {"env_step": 355000, "rew": 3627.7872, "rew_std": 1142.049, "Agent": "TD3"}, {"env_step": 360000, "rew": 3227.9706, "rew_std": 711.5102, "Agent": "TD3"}, {"env_step": 365000, "rew": 3068.6233, "rew_std": 691.8184, "Agent": "TD3"}, {"env_step": 370000, "rew": 3962.7737, "rew_std": 760.0341, "Agent": "TD3"}, {"env_step": 375000, "rew": 3594.7677, "rew_std": 928.1101, "Agent": "TD3"}, {"env_step": 380000, "rew": 3654.0992, "rew_std": 881.6398, "Agent": "TD3"}, {"env_step": 385000, "rew": 3912.8499, "rew_std": 945.1385, "Agent": "TD3"}, {"env_step": 390000, "rew": 3789.8911, "rew_std": 863.4987, "Agent": "TD3"}, {"env_step": 395000, "rew": 3682.2004, "rew_std": 1050.2498, "Agent": "TD3"}, {"env_step": 400000, "rew": 4042.171, "rew_std": 855.7865, "Agent": "TD3"}, {"env_step": 405000, "rew": 4160.8874, "rew_std": 634.3616, "Agent": "TD3"}, {"env_step": 410000, "rew": 3968.93, "rew_std": 772.6093, "Agent": "TD3"}, {"env_step": 415000, "rew": 4362.0422, "rew_std": 761.5106, "Agent": "TD3"}, {"env_step": 420000, "rew": 3947.9836, "rew_std": 735.9527, "Agent": "TD3"}, {"env_step": 425000, "rew": 4205.5062, "rew_std": 788.3009, "Agent": "TD3"}, {"env_step": 430000, "rew": 4308.0382, "rew_std": 395.7122, "Agent": "TD3"}, {"env_step": 435000, "rew": 4216.2622, "rew_std": 871.5691, "Agent": "TD3"}, {"env_step": 440000, "rew": 4050.0608, "rew_std": 577.2572, "Agent": "TD3"}, {"env_step": 445000, "rew": 4563.2002, "rew_std": 491.0323, "Agent": "TD3"}, {"env_step": 450000, "rew": 4183.4363, "rew_std": 674.3578, "Agent": "TD3"}, {"env_step": 455000, "rew": 4401.7438, "rew_std": 639.4418, "Agent": "TD3"}, {"env_step": 460000, "rew": 4497.9864, "rew_std": 751.2121, "Agent": "TD3"}, {"env_step": 465000, "rew": 4643.5722, "rew_std": 438.428, "Agent": "TD3"}, {"env_step": 470000, "rew": 4488.679, "rew_std": 531.0604, "Agent": "TD3"}, {"env_step": 475000, "rew": 4291.1472, "rew_std": 1132.5677, "Agent": "TD3"}, {"env_step": 480000, "rew": 4397.5194, "rew_std": 554.6465, "Agent": "TD3"}, {"env_step": 485000, "rew": 4631.6336, "rew_std": 421.5592, "Agent": "TD3"}, {"env_step": 490000, "rew": 4728.4588, "rew_std": 522.8134, "Agent": "TD3"}, {"env_step": 495000, "rew": 4670.8286, "rew_std": 437.9568, "Agent": "TD3"}, {"env_step": 500000, "rew": 4623.3424, "rew_std": 494.8101, "Agent": "TD3"}, {"env_step": 505000, "rew": 4941.599, "rew_std": 156.4723, "Agent": "TD3"}, {"env_step": 510000, "rew": 4498.4272, "rew_std": 492.6321, "Agent": "TD3"}, {"env_step": 515000, "rew": 4630.5692, "rew_std": 397.6329, "Agent": "TD3"}, {"env_step": 520000, "rew": 4826.7184, "rew_std": 320.7131, "Agent": "TD3"}, {"env_step": 525000, "rew": 4598.1875, "rew_std": 483.902, "Agent": "TD3"}, {"env_step": 530000, "rew": 4496.8694, "rew_std": 584.4539, "Agent": "TD3"}, {"env_step": 535000, "rew": 4623.5366, "rew_std": 351.8769, "Agent": "TD3"}, {"env_step": 540000, "rew": 4603.9342, "rew_std": 658.6824, "Agent": "TD3"}, {"env_step": 545000, "rew": 4682.8686, "rew_std": 562.6961, "Agent": "TD3"}, {"env_step": 550000, "rew": 4620.4423, "rew_std": 732.4667, "Agent": "TD3"}, {"env_step": 555000, "rew": 5009.661, "rew_std": 194.2122, "Agent": "TD3"}, {"env_step": 560000, "rew": 4688.508, "rew_std": 488.5095, "Agent": "TD3"}, {"env_step": 565000, "rew": 4785.6807, "rew_std": 295.0808, "Agent": "TD3"}, {"env_step": 570000, "rew": 4644.8156, "rew_std": 532.46, "Agent": "TD3"}, {"env_step": 575000, "rew": 4779.7482, "rew_std": 295.8876, "Agent": "TD3"}, {"env_step": 580000, "rew": 4770.5819, "rew_std": 491.2643, "Agent": "TD3"}, {"env_step": 585000, "rew": 4631.8668, "rew_std": 404.3156, "Agent": "TD3"}, {"env_step": 590000, "rew": 4815.5844, "rew_std": 477.5273, "Agent": "TD3"}, {"env_step": 595000, "rew": 4915.4074, "rew_std": 276.115, "Agent": "TD3"}, {"env_step": 600000, "rew": 4720.8844, "rew_std": 419.8293, "Agent": "TD3"}, {"env_step": 605000, "rew": 4830.0452, "rew_std": 425.9804, "Agent": "TD3"}, {"env_step": 610000, "rew": 4847.5045, "rew_std": 386.9902, "Agent": "TD3"}, {"env_step": 615000, "rew": 4924.1368, "rew_std": 266.5693, "Agent": "TD3"}, {"env_step": 620000, "rew": 4988.3792, "rew_std": 169.3005, "Agent": "TD3"}, {"env_step": 625000, "rew": 4724.847, "rew_std": 579.4092, "Agent": "TD3"}, {"env_step": 630000, "rew": 4761.8745, "rew_std": 440.2406, "Agent": "TD3"}, {"env_step": 635000, "rew": 4775.3046, "rew_std": 381.7462, "Agent": "TD3"}, {"env_step": 640000, "rew": 4946.9403, "rew_std": 383.9484, "Agent": "TD3"}, {"env_step": 645000, "rew": 4982.5448, "rew_std": 214.4079, "Agent": "TD3"}, {"env_step": 650000, "rew": 5004.9466, "rew_std": 150.9016, "Agent": "TD3"}, {"env_step": 655000, "rew": 4995.9812, "rew_std": 240.261, "Agent": "TD3"}, {"env_step": 660000, "rew": 4917.1866, "rew_std": 469.1764, "Agent": "TD3"}, {"env_step": 665000, "rew": 4801.5734, "rew_std": 506.8326, "Agent": "TD3"}, {"env_step": 670000, "rew": 4858.4089, "rew_std": 262.0223, "Agent": "TD3"}, {"env_step": 675000, "rew": 4995.3341, "rew_std": 190.7018, "Agent": "TD3"}, {"env_step": 680000, "rew": 4993.243, "rew_std": 256.0528, "Agent": "TD3"}, {"env_step": 685000, "rew": 4894.9504, "rew_std": 329.4103, "Agent": "TD3"}, {"env_step": 690000, "rew": 4836.4288, "rew_std": 333.3621, "Agent": "TD3"}, {"env_step": 695000, "rew": 4863.7781, "rew_std": 429.5135, "Agent": "TD3"}, {"env_step": 700000, "rew": 5047.3576, "rew_std": 176.8078, "Agent": "TD3"}, {"env_step": 705000, "rew": 4996.33, "rew_std": 201.191, "Agent": "TD3"}, {"env_step": 710000, "rew": 4880.6173, "rew_std": 230.9537, "Agent": "TD3"}, {"env_step": 715000, "rew": 5037.2655, "rew_std": 184.4567, "Agent": "TD3"}, {"env_step": 720000, "rew": 4857.1692, "rew_std": 454.8993, "Agent": "TD3"}, {"env_step": 725000, "rew": 4750.6899, "rew_std": 463.4295, "Agent": "TD3"}, {"env_step": 730000, "rew": 5040.6027, "rew_std": 215.3514, "Agent": "TD3"}, {"env_step": 735000, "rew": 4920.5525, "rew_std": 265.3201, "Agent": "TD3"}, {"env_step": 740000, "rew": 4908.3612, "rew_std": 355.8871, "Agent": "TD3"}, {"env_step": 745000, "rew": 5125.8994, "rew_std": 161.9509, "Agent": "TD3"}, {"env_step": 750000, "rew": 5000.1682, "rew_std": 244.1228, "Agent": "TD3"}, {"env_step": 755000, "rew": 5019.9781, "rew_std": 267.8087, "Agent": "TD3"}, {"env_step": 760000, "rew": 5121.22, "rew_std": 108.2708, "Agent": "TD3"}, {"env_step": 765000, "rew": 5064.4168, "rew_std": 237.7942, "Agent": "TD3"}, {"env_step": 770000, "rew": 5113.9521, "rew_std": 139.6293, "Agent": "TD3"}, {"env_step": 775000, "rew": 4808.9893, "rew_std": 458.4127, "Agent": "TD3"}, {"env_step": 780000, "rew": 5108.4583, "rew_std": 140.2175, "Agent": "TD3"}, {"env_step": 785000, "rew": 4874.2555, "rew_std": 306.674, "Agent": "TD3"}, {"env_step": 790000, "rew": 5114.0341, "rew_std": 222.1771, "Agent": "TD3"}, {"env_step": 795000, "rew": 4875.5048, "rew_std": 385.4428, "Agent": "TD3"}, {"env_step": 800000, "rew": 5079.8931, "rew_std": 246.6054, "Agent": "TD3"}, {"env_step": 805000, "rew": 5133.4923, "rew_std": 139.7789, "Agent": "TD3"}, {"env_step": 810000, "rew": 5050.1196, "rew_std": 288.2048, "Agent": "TD3"}, {"env_step": 815000, "rew": 5100.0691, "rew_std": 271.2653, "Agent": "TD3"}, {"env_step": 820000, "rew": 4971.7669, "rew_std": 269.1686, "Agent": "TD3"}, {"env_step": 825000, "rew": 4933.0076, "rew_std": 430.8825, "Agent": "TD3"}, {"env_step": 830000, "rew": 5101.0741, "rew_std": 113.8671, "Agent": "TD3"}, {"env_step": 835000, "rew": 5013.3863, "rew_std": 249.3497, "Agent": "TD3"}, {"env_step": 840000, "rew": 5001.234, "rew_std": 243.7169, "Agent": "TD3"}, {"env_step": 845000, "rew": 5018.7245, "rew_std": 199.6715, "Agent": "TD3"}, {"env_step": 850000, "rew": 4988.2064, "rew_std": 411.9275, "Agent": "TD3"}, {"env_step": 855000, "rew": 4938.9949, "rew_std": 352.3513, "Agent": "TD3"}, {"env_step": 860000, "rew": 5002.8016, "rew_std": 254.9775, "Agent": "TD3"}, {"env_step": 865000, "rew": 5017.9034, "rew_std": 171.6877, "Agent": "TD3"}, {"env_step": 870000, "rew": 4930.6844, "rew_std": 457.0508, "Agent": "TD3"}, {"env_step": 875000, "rew": 4979.0143, "rew_std": 219.4724, "Agent": "TD3"}, {"env_step": 880000, "rew": 4947.4845, "rew_std": 345.9994, "Agent": "TD3"}, {"env_step": 885000, "rew": 4908.4159, "rew_std": 484.5035, "Agent": "TD3"}, {"env_step": 890000, "rew": 4946.5147, "rew_std": 332.8934, "Agent": "TD3"}, {"env_step": 895000, "rew": 5160.1536, "rew_std": 207.4863, "Agent": "TD3"}, {"env_step": 900000, "rew": 5084.8653, "rew_std": 252.4938, "Agent": "TD3"}, {"env_step": 905000, "rew": 5131.8246, "rew_std": 158.9648, "Agent": "TD3"}, {"env_step": 910000, "rew": 5086.175, "rew_std": 151.9426, "Agent": "TD3"}, {"env_step": 915000, "rew": 5163.2683, "rew_std": 139.7717, "Agent": "TD3"}, {"env_step": 920000, "rew": 5113.859, "rew_std": 133.0161, "Agent": "TD3"}, {"env_step": 925000, "rew": 5114.2944, "rew_std": 214.1085, "Agent": "TD3"}, {"env_step": 930000, "rew": 5185.9206, "rew_std": 109.1179, "Agent": "TD3"}, {"env_step": 935000, "rew": 5128.1275, "rew_std": 169.5002, "Agent": "TD3"}, {"env_step": 940000, "rew": 4936.1542, "rew_std": 303.652, "Agent": "TD3"}, {"env_step": 945000, "rew": 5150.1266, "rew_std": 105.97, "Agent": "TD3"}, {"env_step": 950000, "rew": 5045.5078, "rew_std": 263.0376, "Agent": "TD3"}, {"env_step": 955000, "rew": 5106.9053, "rew_std": 143.1704, "Agent": "TD3"}, {"env_step": 960000, "rew": 4965.0764, "rew_std": 365.9184, "Agent": "TD3"}, {"env_step": 965000, "rew": 5094.2522, "rew_std": 240.831, "Agent": "TD3"}, {"env_step": 970000, "rew": 5142.6073, "rew_std": 128.5266, "Agent": "TD3"}, {"env_step": 975000, "rew": 5189.5491, "rew_std": 178.4785, "Agent": "TD3"}, {"env_step": 980000, "rew": 5005.5165, "rew_std": 513.0527, "Agent": "TD3"}, {"env_step": 985000, "rew": 5129.9301, "rew_std": 168.1549, "Agent": "TD3"}, {"env_step": 990000, "rew": 5030.1055, "rew_std": 318.9333, "Agent": "TD3"}, {"env_step": 995000, "rew": 5137.759, "rew_std": 203.0376, "Agent": "TD3"}, {"env_step": 1000000, "rew": 5043.2619, "rew_std": 286.2232, "Agent": "TD3"}, {"env_step": 1005000, "rew": 5153.1375, "rew_std": 176.2132, "Agent": "TD3"}, {"env_step": 1010000, "rew": 5121.4074, "rew_std": 239.9469, "Agent": "TD3"}, {"env_step": 1015000, "rew": 5029.4641, "rew_std": 281.9055, "Agent": "TD3"}, {"env_step": 1020000, "rew": 5119.6649, "rew_std": 238.2116, "Agent": "TD3"}, {"env_step": 1025000, "rew": 5093.208, "rew_std": 266.519, "Agent": "TD3"}, {"env_step": 1030000, "rew": 5063.8444, "rew_std": 267.4462, "Agent": "TD3"}, {"env_step": 1035000, "rew": 5060.6371, "rew_std": 270.9232, "Agent": "TD3"}, {"env_step": 1040000, "rew": 5145.6034, "rew_std": 225.2249, "Agent": "TD3"}, {"env_step": 1045000, "rew": 5199.8301, "rew_std": 118.791, "Agent": "TD3"}, {"env_step": 1050000, "rew": 5124.249, "rew_std": 271.596, "Agent": "TD3"}, {"env_step": 1055000, "rew": 5157.4669, "rew_std": 147.9857, "Agent": "TD3"}, {"env_step": 1060000, "rew": 5171.9615, "rew_std": 221.3771, "Agent": "TD3"}, {"env_step": 1065000, "rew": 5168.2077, "rew_std": 235.7423, "Agent": "TD3"}, {"env_step": 1070000, "rew": 5131.0357, "rew_std": 203.1461, "Agent": "TD3"}, {"env_step": 1075000, "rew": 5114.448, "rew_std": 254.8144, "Agent": "TD3"}, {"env_step": 1080000, "rew": 5188.6507, "rew_std": 171.5331, "Agent": "TD3"}, {"env_step": 1085000, "rew": 5094.6068, "rew_std": 242.4939, "Agent": "TD3"}, {"env_step": 1090000, "rew": 5178.7567, "rew_std": 117.6536, "Agent": "TD3"}, {"env_step": 1095000, "rew": 5134.6964, "rew_std": 241.2062, "Agent": "TD3"}, {"env_step": 1100000, "rew": 5021.4631, "rew_std": 283.4483, "Agent": "TD3"}, {"env_step": 1105000, "rew": 5129.941, "rew_std": 238.1083, "Agent": "TD3"}, {"env_step": 1110000, "rew": 5179.2979, "rew_std": 226.6365, "Agent": "TD3"}, {"env_step": 1115000, "rew": 5054.2752, "rew_std": 288.4716, "Agent": "TD3"}, {"env_step": 1120000, "rew": 5118.64, "rew_std": 223.76, "Agent": "TD3"}, {"env_step": 1125000, "rew": 5032.9734, "rew_std": 233.2601, "Agent": "TD3"}, {"env_step": 1130000, "rew": 5138.4733, "rew_std": 235.9326, "Agent": "TD3"}, {"env_step": 1135000, "rew": 4996.6592, "rew_std": 360.9811, "Agent": "TD3"}, {"env_step": 1140000, "rew": 5107.5643, "rew_std": 267.7652, "Agent": "TD3"}, {"env_step": 1145000, "rew": 4829.5349, "rew_std": 501.3194, "Agent": "TD3"}, {"env_step": 1150000, "rew": 5098.5737, "rew_std": 269.75, "Agent": "TD3"}, {"env_step": 1155000, "rew": 5140.4421, "rew_std": 219.9037, "Agent": "TD3"}, {"env_step": 1160000, "rew": 4887.2352, "rew_std": 754.7954, "Agent": "TD3"}, {"env_step": 1165000, "rew": 5194.6158, "rew_std": 238.8039, "Agent": "TD3"}, {"env_step": 1170000, "rew": 5103.5817, "rew_std": 252.1515, "Agent": "TD3"}, {"env_step": 1175000, "rew": 4956.8485, "rew_std": 407.4093, "Agent": "TD3"}, {"env_step": 1180000, "rew": 4921.0582, "rew_std": 443.066, "Agent": "TD3"}, {"env_step": 1185000, "rew": 5166.1484, "rew_std": 154.7587, "Agent": "TD3"}, {"env_step": 1190000, "rew": 5014.7964, "rew_std": 365.9749, "Agent": "TD3"}, {"env_step": 1195000, "rew": 4814.9366, "rew_std": 545.8645, "Agent": "TD3"}, {"env_step": 1200000, "rew": 5006.7689, "rew_std": 300.7244, "Agent": "TD3"}, {"env_step": 1205000, "rew": 5108.7124, "rew_std": 302.142, "Agent": "TD3"}, {"env_step": 1210000, "rew": 5088.0629, "rew_std": 416.3904, "Agent": "TD3"}, {"env_step": 1215000, "rew": 4947.1785, "rew_std": 551.1925, "Agent": "TD3"}, {"env_step": 1220000, "rew": 5089.226, "rew_std": 211.0536, "Agent": "TD3"}, {"env_step": 1225000, "rew": 4877.8198, "rew_std": 470.0478, "Agent": "TD3"}, {"env_step": 1230000, "rew": 5148.8341, "rew_std": 444.5354, "Agent": "TD3"}, {"env_step": 1235000, "rew": 5116.8597, "rew_std": 298.4278, "Agent": "TD3"}, {"env_step": 1240000, "rew": 5092.3513, "rew_std": 270.159, "Agent": "TD3"}, {"env_step": 1245000, "rew": 4793.7686, "rew_std": 1118.6323, "Agent": "TD3"}, {"env_step": 1250000, "rew": 4907.0573, "rew_std": 349.6552, "Agent": "TD3"}, {"env_step": 0, "rew": 134.2851, "rew_std": 8.9071, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 132.3317, "rew_std": 11.5884, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 145.5181, "rew_std": 8.2425, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 160.6736, "rew_std": 20.2516, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 182.995, "rew_std": 21.3789, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 229.754, "rew_std": 36.6985, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 279.1829, "rew_std": 34.0526, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 298.9748, "rew_std": 51.2942, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 347.8587, "rew_std": 34.0078, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 346.622, "rew_std": 40.2387, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 356.9964, "rew_std": 31.2667, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 348.9647, "rew_std": 42.06, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 357.4741, "rew_std": 44.106, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 369.9218, "rew_std": 54.5148, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 390.0737, "rew_std": 44.8478, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 381.269, "rew_std": 48.6122, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 362.2927, "rew_std": 40.5626, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 376.2153, "rew_std": 48.4882, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 392.1445, "rew_std": 49.4761, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 385.8984, "rew_std": 51.5347, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 379.0199, "rew_std": 37.4646, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 384.7891, "rew_std": 28.1911, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 370.1497, "rew_std": 46.0869, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 382.5503, "rew_std": 30.2578, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 392.037, "rew_std": 35.1496, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 385.1342, "rew_std": 54.9051, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 373.2024, "rew_std": 46.5376, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 382.3954, "rew_std": 54.6306, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 370.3266, "rew_std": 56.9917, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 374.9132, "rew_std": 60.8034, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 372.2838, "rew_std": 55.2198, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 363.9386, "rew_std": 44.3701, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 393.1796, "rew_std": 53.9256, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 391.3388, "rew_std": 41.1072, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 378.9883, "rew_std": 50.5282, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 377.087, "rew_std": 56.9021, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 363.5972, "rew_std": 51.4931, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 399.5731, "rew_std": 55.8625, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 405.3753, "rew_std": 62.2749, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 402.9043, "rew_std": 53.5287, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 414.8761, "rew_std": 38.5687, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 399.3817, "rew_std": 50.0419, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 398.1147, "rew_std": 57.708, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 380.6883, "rew_std": 54.8462, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 396.672, "rew_std": 56.6795, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 386.1521, "rew_std": 58.6364, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 367.3148, "rew_std": 41.4321, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 372.0875, "rew_std": 50.2092, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 382.4313, "rew_std": 48.7902, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 396.4733, "rew_std": 44.2938, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 380.5775, "rew_std": 46.8464, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 382.3344, "rew_std": 28.7958, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 382.907, "rew_std": 40.5035, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 406.9931, "rew_std": 37.8681, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 413.1177, "rew_std": 62.0168, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 401.5583, "rew_std": 20.9659, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 391.8222, "rew_std": 27.7617, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 423.1126, "rew_std": 38.2972, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 412.7687, "rew_std": 37.9509, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 397.8555, "rew_std": 32.0286, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 399.915, "rew_std": 26.438, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 438.2131, "rew_std": 47.8379, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 388.0629, "rew_std": 37.9841, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 405.3549, "rew_std": 47.5364, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 400.3994, "rew_std": 48.1861, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 421.4098, "rew_std": 58.5822, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 419.1956, "rew_std": 60.8501, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 404.4959, "rew_std": 39.7589, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 411.0288, "rew_std": 45.8849, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 403.3878, "rew_std": 45.458, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 402.6161, "rew_std": 44.98, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 402.5555, "rew_std": 37.1715, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 405.1573, "rew_std": 46.4707, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 405.7697, "rew_std": 51.8826, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 399.8488, "rew_std": 45.9409, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 400.3283, "rew_std": 37.1483, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 404.6552, "rew_std": 43.07, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 417.5301, "rew_std": 57.2134, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 422.0997, "rew_std": 46.2711, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 421.0184, "rew_std": 50.7304, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 417.0316, "rew_std": 41.817, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 398.6818, "rew_std": 42.1057, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 403.3902, "rew_std": 34.9101, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 413.0594, "rew_std": 57.6956, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 391.2237, "rew_std": 43.119, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 398.634, "rew_std": 38.1579, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 414.8102, "rew_std": 55.8519, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 428.2386, "rew_std": 61.3671, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 413.7839, "rew_std": 53.886, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 409.3724, "rew_std": 58.9423, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 418.4324, "rew_std": 41.7632, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 411.0972, "rew_std": 53.0598, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 385.6242, "rew_std": 45.5054, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 409.6031, "rew_std": 46.3376, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 401.2584, "rew_std": 62.2796, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 401.0642, "rew_std": 58.2344, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 400.8198, "rew_std": 67.4508, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 399.4039, "rew_std": 53.3394, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 389.8431, "rew_std": 39.3272, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 394.067, "rew_std": 47.9829, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 387.9552, "rew_std": 49.9772, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 387.1675, "rew_std": 65.9888, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 378.6828, "rew_std": 64.4292, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 393.6185, "rew_std": 45.4058, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 394.6443, "rew_std": 46.5393, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 393.1369, "rew_std": 62.1013, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 407.482, "rew_std": 51.7877, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 400.4091, "rew_std": 62.9306, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 393.4948, "rew_std": 64.1455, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 406.3127, "rew_std": 56.6238, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 397.3756, "rew_std": 64.2524, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 415.5537, "rew_std": 78.358, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 390.5978, "rew_std": 48.545, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 381.6533, "rew_std": 50.4349, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 414.7084, "rew_std": 75.1391, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 411.7969, "rew_std": 61.9639, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 395.862, "rew_std": 51.1378, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 394.9354, "rew_std": 72.9375, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 389.1405, "rew_std": 57.53, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 397.4184, "rew_std": 69.5013, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 402.134, "rew_std": 68.5505, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 388.0043, "rew_std": 60.6637, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 388.857, "rew_std": 61.1726, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 395.8664, "rew_std": 80.3261, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 391.2895, "rew_std": 50.6701, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 375.5112, "rew_std": 51.7993, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 385.1477, "rew_std": 74.1886, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 385.6211, "rew_std": 58.569, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 403.1113, "rew_std": 56.767, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 393.6033, "rew_std": 51.2387, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 398.7294, "rew_std": 53.0198, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 404.4069, "rew_std": 53.2228, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 379.2343, "rew_std": 57.0353, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 387.5677, "rew_std": 60.9631, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 377.398, "rew_std": 49.0542, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 406.3338, "rew_std": 63.9793, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 405.1044, "rew_std": 58.2787, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 394.9841, "rew_std": 57.9348, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 425.3993, "rew_std": 55.3748, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 395.7237, "rew_std": 50.2733, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 410.0695, "rew_std": 58.4723, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 420.7224, "rew_std": 54.1291, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 407.6703, "rew_std": 57.0062, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 388.5928, "rew_std": 59.4505, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 398.4204, "rew_std": 38.8942, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 422.9708, "rew_std": 62.4621, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 407.7592, "rew_std": 45.2911, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 397.7424, "rew_std": 64.5239, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 364.0651, "rew_std": 42.8236, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 387.8125, "rew_std": 67.7828, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 387.8849, "rew_std": 56.7927, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 395.0737, "rew_std": 52.0062, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 377.2858, "rew_std": 39.734, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 408.0436, "rew_std": 84.4176, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 393.7722, "rew_std": 55.7614, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 386.8071, "rew_std": 64.2477, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 394.8259, "rew_std": 72.5374, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 390.2458, "rew_std": 65.5436, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 382.4817, "rew_std": 62.6421, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 399.1333, "rew_std": 66.9132, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 395.0744, "rew_std": 65.0951, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 401.2925, "rew_std": 70.9549, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 399.4059, "rew_std": 60.6538, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 406.6179, "rew_std": 68.7601, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 387.8888, "rew_std": 71.1222, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 417.4409, "rew_std": 72.5182, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 426.0181, "rew_std": 84.6085, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 416.9954, "rew_std": 63.1179, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 441.1564, "rew_std": 79.9664, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 433.2006, "rew_std": 75.029, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 414.7991, "rew_std": 56.961, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 414.7902, "rew_std": 71.8032, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 425.6593, "rew_std": 62.7082, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 419.4213, "rew_std": 53.4877, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 424.5813, "rew_std": 77.928, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 403.1615, "rew_std": 76.368, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 415.7097, "rew_std": 78.4011, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 401.4143, "rew_std": 75.9469, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 392.6702, "rew_std": 76.9324, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 387.4285, "rew_std": 59.568, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 384.1608, "rew_std": 57.6717, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 397.3022, "rew_std": 80.0755, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 401.4928, "rew_std": 73.1254, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 405.6077, "rew_std": 64.9382, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 403.2244, "rew_std": 63.7616, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 391.268, "rew_std": 54.4662, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 379.5553, "rew_std": 61.4862, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 380.6899, "rew_std": 54.1494, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 395.1274, "rew_std": 40.2667, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 395.3674, "rew_std": 46.3753, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 407.7103, "rew_std": 64.0663, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 411.9753, "rew_std": 66.9703, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 424.2286, "rew_std": 69.2321, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 414.3711, "rew_std": 52.4139, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 411.0705, "rew_std": 41.1486, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 412.0928, "rew_std": 68.2498, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 435.4422, "rew_std": 67.59, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 421.7476, "rew_std": 54.2258, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 421.9272, "rew_std": 56.9114, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 434.3955, "rew_std": 50.4299, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 417.1998, "rew_std": 50.2433, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 423.4868, "rew_std": 69.0047, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 421.0292, "rew_std": 55.9664, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 421.5478, "rew_std": 61.617, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 438.953, "rew_std": 73.0025, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 417.898, "rew_std": 56.2191, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 430.4892, "rew_std": 72.7653, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 423.9785, "rew_std": 54.0521, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 418.1322, "rew_std": 60.4062, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 432.6341, "rew_std": 52.3553, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 429.442, "rew_std": 66.8584, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 429.4091, "rew_std": 55.5702, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 433.1991, "rew_std": 57.5528, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 421.4787, "rew_std": 64.1868, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 429.2496, "rew_std": 68.345, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 428.7888, "rew_std": 72.7331, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 421.8156, "rew_std": 53.2816, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 441.9151, "rew_std": 58.0016, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 432.4622, "rew_std": 52.1868, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 428.4346, "rew_std": 51.4958, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 448.5581, "rew_std": 61.1799, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 436.737, "rew_std": 56.055, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 450.0283, "rew_std": 60.1757, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 426.9679, "rew_std": 53.4073, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 445.6709, "rew_std": 58.9099, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 435.5077, "rew_std": 50.8351, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 438.1268, "rew_std": 47.7346, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 435.6654, "rew_std": 48.6435, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 447.6092, "rew_std": 45.757, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 432.7806, "rew_std": 59.0931, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 464.3061, "rew_std": 58.4102, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 448.0351, "rew_std": 54.4852, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 438.2387, "rew_std": 51.9289, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 445.8886, "rew_std": 49.4097, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 428.4683, "rew_std": 62.5219, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 447.5914, "rew_std": 62.3059, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 422.7578, "rew_std": 64.5611, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 435.1532, "rew_std": 53.3779, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 425.5023, "rew_std": 46.7849, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 432.1564, "rew_std": 57.7707, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 415.4793, "rew_std": 49.0723, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 423.3059, "rew_std": 54.1695, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 434.0937, "rew_std": 65.467, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 421.1951, "rew_std": 37.9896, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 424.2354, "rew_std": 32.1225, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 414.4942, "rew_std": 61.44, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 420.6777, "rew_std": 48.6498, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 421.6311, "rew_std": 41.9637, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 419.5132, "rew_std": 44.5098, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 453.7393, "rew_std": 72.3884, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 431.989, "rew_std": 67.0335, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 437.4101, "rew_std": 66.4708, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 428.4059, "rew_std": 57.9871, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 429.2049, "rew_std": 46.1541, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 427.6781, "rew_std": 50.5812, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 435.1144, "rew_std": 41.9573, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 442.6668, "rew_std": 63.9423, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 416.4572, "rew_std": 35.7496, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 432.7108, "rew_std": 52.7162, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 435.7087, "rew_std": 63.0129, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 443.6482, "rew_std": 64.473, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 426.112, "rew_std": 65.1428, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 419.717, "rew_std": 49.5256, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 427.3948, "rew_std": 51.7217, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 418.2876, "rew_std": 55.8575, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 425.3464, "rew_std": 63.9193, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 422.2139, "rew_std": 64.3602, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 425.3817, "rew_std": 62.3121, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 430.0611, "rew_std": 74.026, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 426.6266, "rew_std": 54.1855, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 425.9563, "rew_std": 54.4198, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 416.8308, "rew_std": 43.4318, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 427.924, "rew_std": 53.4286, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 425.8094, "rew_std": 48.7615, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 436.37, "rew_std": 51.3194, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 450.7627, "rew_std": 73.5331, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 428.6428, "rew_std": 39.332, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 415.792, "rew_std": 35.9552, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 442.3338, "rew_std": 55.9098, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 420.0383, "rew_std": 40.6303, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 427.539, "rew_std": 48.1522, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 446.8737, "rew_std": 53.3549, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 422.7955, "rew_std": 49.8506, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 415.8156, "rew_std": 53.8267, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 437.5864, "rew_std": 68.5622, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 441.8165, "rew_std": 61.7589, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 432.717, "rew_std": 62.6678, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 430.1473, "rew_std": 52.4954, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 434.8537, "rew_std": 58.7462, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 422.1588, "rew_std": 50.1868, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 419.7322, "rew_std": 43.2847, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 415.9212, "rew_std": 43.222, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 425.6137, "rew_std": 60.322, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 421.9776, "rew_std": 63.0022, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 425.4186, "rew_std": 55.3349, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 432.6951, "rew_std": 54.8226, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 422.8864, "rew_std": 48.8194, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 421.418, "rew_std": 46.865, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 433.4248, "rew_std": 42.999, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 419.0434, "rew_std": 44.146, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 415.736, "rew_std": 41.3839, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 414.7147, "rew_std": 36.7896, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 434.3581, "rew_std": 54.3064, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 425.1595, "rew_std": 55.6919, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 442.9066, "rew_std": 67.8961, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 429.9155, "rew_std": 52.8229, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 433.3738, "rew_std": 67.7054, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 424.5967, "rew_std": 58.8434, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 432.9595, "rew_std": 46.7897, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 427.9092, "rew_std": 43.758, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 426.2477, "rew_std": 48.9913, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 415.2017, "rew_std": 49.432, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 438.1663, "rew_std": 57.0268, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 445.0344, "rew_std": 56.2595, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 431.6359, "rew_std": 52.3226, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 428.2467, "rew_std": 53.144, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 430.8904, "rew_std": 50.9101, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 435.7712, "rew_std": 74.0012, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 440.82, "rew_std": 61.388, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 434.538, "rew_std": 62.4474, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 414.1024, "rew_std": 48.7035, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 427.8226, "rew_std": 53.4481, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 426.8527, "rew_std": 56.4748, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 415.904, "rew_std": 42.7152, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 428.6406, "rew_std": 52.1272, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 427.6787, "rew_std": 49.7561, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 420.2958, "rew_std": 53.3219, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 435.3111, "rew_std": 58.5596, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 428.058, "rew_std": 52.0583, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 430.8424, "rew_std": 53.0753, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 434.0074, "rew_std": 58.8144, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 427.3266, "rew_std": 67.2677, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 436.6506, "rew_std": 58.1863, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 425.308, "rew_std": 53.5519, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 177.3211, "rew_std": 77.5947, "Agent": "SAC"}, {"env_step": 5000, "rew": 283.2922, "rew_std": 15.6399, "Agent": "SAC"}, {"env_step": 10000, "rew": 299.9204, "rew_std": 31.8772, "Agent": "SAC"}, {"env_step": 15000, "rew": 435.967, "rew_std": 59.9478, "Agent": "SAC"}, {"env_step": 20000, "rew": 449.6315, "rew_std": 50.5159, "Agent": "SAC"}, {"env_step": 25000, "rew": 462.7225, "rew_std": 70.3407, "Agent": "SAC"}, {"env_step": 30000, "rew": 527.9205, "rew_std": 62.4189, "Agent": "SAC"}, {"env_step": 35000, "rew": 462.1104, "rew_std": 103.0253, "Agent": "SAC"}, {"env_step": 40000, "rew": 502.3742, "rew_std": 89.7226, "Agent": "SAC"}, {"env_step": 45000, "rew": 508.4995, "rew_std": 71.7847, "Agent": "SAC"}, {"env_step": 50000, "rew": 573.9444, "rew_std": 99.0155, "Agent": "SAC"}, {"env_step": 55000, "rew": 550.6721, "rew_std": 65.356, "Agent": "SAC"}, {"env_step": 60000, "rew": 587.3824, "rew_std": 68.5067, "Agent": "SAC"}, {"env_step": 65000, "rew": 601.1097, "rew_std": 87.2493, "Agent": "SAC"}, {"env_step": 70000, "rew": 600.142, "rew_std": 60.1349, "Agent": "SAC"}, {"env_step": 75000, "rew": 594.4696, "rew_std": 61.1347, "Agent": "SAC"}, {"env_step": 80000, "rew": 590.6473, "rew_std": 71.1667, "Agent": "SAC"}, {"env_step": 85000, "rew": 594.3895, "rew_std": 62.5243, "Agent": "SAC"}, {"env_step": 90000, "rew": 618.5582, "rew_std": 86.4116, "Agent": "SAC"}, {"env_step": 95000, "rew": 644.4827, "rew_std": 102.1717, "Agent": "SAC"}, {"env_step": 100000, "rew": 629.4648, "rew_std": 106.451, "Agent": "SAC"}, {"env_step": 105000, "rew": 633.1271, "rew_std": 68.8717, "Agent": "SAC"}, {"env_step": 110000, "rew": 631.02, "rew_std": 71.8617, "Agent": "SAC"}, {"env_step": 115000, "rew": 584.2877, "rew_std": 59.1475, "Agent": "SAC"}, {"env_step": 120000, "rew": 597.579, "rew_std": 52.4268, "Agent": "SAC"}, {"env_step": 125000, "rew": 622.5235, "rew_std": 61.8045, "Agent": "SAC"}, {"env_step": 130000, "rew": 649.8092, "rew_std": 110.1307, "Agent": "SAC"}, {"env_step": 135000, "rew": 613.3262, "rew_std": 75.1675, "Agent": "SAC"}, {"env_step": 140000, "rew": 645.5737, "rew_std": 97.3171, "Agent": "SAC"}, {"env_step": 145000, "rew": 586.2649, "rew_std": 59.617, "Agent": "SAC"}, {"env_step": 150000, "rew": 625.0649, "rew_std": 79.55, "Agent": "SAC"}, {"env_step": 155000, "rew": 637.2469, "rew_std": 83.9602, "Agent": "SAC"}, {"env_step": 160000, "rew": 620.3274, "rew_std": 89.7393, "Agent": "SAC"}, {"env_step": 165000, "rew": 619.5069, "rew_std": 67.1062, "Agent": "SAC"}, {"env_step": 170000, "rew": 630.8656, "rew_std": 68.1679, "Agent": "SAC"}, {"env_step": 175000, "rew": 682.0407, "rew_std": 99.4304, "Agent": "SAC"}, {"env_step": 180000, "rew": 651.833, "rew_std": 60.173, "Agent": "SAC"}, {"env_step": 185000, "rew": 658.08, "rew_std": 53.9764, "Agent": "SAC"}, {"env_step": 190000, "rew": 680.1662, "rew_std": 106.7121, "Agent": "SAC"}, {"env_step": 195000, "rew": 673.2192, "rew_std": 86.1533, "Agent": "SAC"}, {"env_step": 200000, "rew": 767.8674, "rew_std": 306.8412, "Agent": "SAC"}, {"env_step": 205000, "rew": 720.5668, "rew_std": 146.6656, "Agent": "SAC"}, {"env_step": 210000, "rew": 747.1972, "rew_std": 239.9881, "Agent": "SAC"}, {"env_step": 215000, "rew": 790.9514, "rew_std": 322.2662, "Agent": "SAC"}, {"env_step": 220000, "rew": 817.9376, "rew_std": 308.4281, "Agent": "SAC"}, {"env_step": 225000, "rew": 788.8247, "rew_std": 334.612, "Agent": "SAC"}, {"env_step": 230000, "rew": 882.7069, "rew_std": 506.6814, "Agent": "SAC"}, {"env_step": 235000, "rew": 839.2083, "rew_std": 410.4154, "Agent": "SAC"}, {"env_step": 240000, "rew": 835.0124, "rew_std": 357.7152, "Agent": "SAC"}, {"env_step": 245000, "rew": 1098.2356, "rew_std": 823.3634, "Agent": "SAC"}, {"env_step": 250000, "rew": 718.2728, "rew_std": 111.0831, "Agent": "SAC"}, {"env_step": 255000, "rew": 827.5897, "rew_std": 350.9259, "Agent": "SAC"}, {"env_step": 260000, "rew": 863.331, "rew_std": 285.7051, "Agent": "SAC"}, {"env_step": 265000, "rew": 961.4804, "rew_std": 394.793, "Agent": "SAC"}, {"env_step": 270000, "rew": 974.2971, "rew_std": 384.0907, "Agent": "SAC"}, {"env_step": 275000, "rew": 1315.7752, "rew_std": 1288.8193, "Agent": "SAC"}, {"env_step": 280000, "rew": 1036.5671, "rew_std": 413.9318, "Agent": "SAC"}, {"env_step": 285000, "rew": 928.6535, "rew_std": 325.435, "Agent": "SAC"}, {"env_step": 290000, "rew": 1266.3388, "rew_std": 1018.1861, "Agent": "SAC"}, {"env_step": 295000, "rew": 1888.0376, "rew_std": 1495.7165, "Agent": "SAC"}, {"env_step": 300000, "rew": 2044.8745, "rew_std": 1310.538, "Agent": "SAC"}, {"env_step": 305000, "rew": 1470.7834, "rew_std": 803.1499, "Agent": "SAC"}, {"env_step": 310000, "rew": 1434.7183, "rew_std": 748.1661, "Agent": "SAC"}, {"env_step": 315000, "rew": 1784.8552, "rew_std": 942.3052, "Agent": "SAC"}, {"env_step": 320000, "rew": 2115.5942, "rew_std": 1219.7121, "Agent": "SAC"}, {"env_step": 325000, "rew": 2098.7451, "rew_std": 1303.318, "Agent": "SAC"}, {"env_step": 330000, "rew": 1410.295, "rew_std": 761.9196, "Agent": "SAC"}, {"env_step": 335000, "rew": 1552.3471, "rew_std": 741.9198, "Agent": "SAC"}, {"env_step": 340000, "rew": 2020.108, "rew_std": 1466.2618, "Agent": "SAC"}, {"env_step": 345000, "rew": 1933.2728, "rew_std": 1159.0629, "Agent": "SAC"}, {"env_step": 350000, "rew": 2628.7817, "rew_std": 1552.1157, "Agent": "SAC"}, {"env_step": 355000, "rew": 2216.6806, "rew_std": 1650.5325, "Agent": "SAC"}, {"env_step": 360000, "rew": 2484.4005, "rew_std": 1243.7294, "Agent": "SAC"}, {"env_step": 365000, "rew": 2407.9889, "rew_std": 1347.9589, "Agent": "SAC"}, {"env_step": 370000, "rew": 2311.8579, "rew_std": 1337.9997, "Agent": "SAC"}, {"env_step": 375000, "rew": 2689.6973, "rew_std": 1398.341, "Agent": "SAC"}, {"env_step": 380000, "rew": 2529.8016, "rew_std": 1376.7045, "Agent": "SAC"}, {"env_step": 385000, "rew": 2972.2652, "rew_std": 1538.8946, "Agent": "SAC"}, {"env_step": 390000, "rew": 2250.7697, "rew_std": 1463.934, "Agent": "SAC"}, {"env_step": 395000, "rew": 3235.0548, "rew_std": 1710.5823, "Agent": "SAC"}, {"env_step": 400000, "rew": 2194.9027, "rew_std": 1050.3855, "Agent": "SAC"}, {"env_step": 405000, "rew": 2287.7077, "rew_std": 869.8738, "Agent": "SAC"}, {"env_step": 410000, "rew": 2320.09, "rew_std": 1832.5621, "Agent": "SAC"}, {"env_step": 415000, "rew": 3345.4752, "rew_std": 1581.5452, "Agent": "SAC"}, {"env_step": 420000, "rew": 2544.4616, "rew_std": 1693.8445, "Agent": "SAC"}, {"env_step": 425000, "rew": 2865.4076, "rew_std": 1797.1184, "Agent": "SAC"}, {"env_step": 430000, "rew": 3017.8232, "rew_std": 1433.5879, "Agent": "SAC"}, {"env_step": 435000, "rew": 2893.0204, "rew_std": 1024.7995, "Agent": "SAC"}, {"env_step": 440000, "rew": 3590.2399, "rew_std": 1626.9296, "Agent": "SAC"}, {"env_step": 445000, "rew": 3408.5708, "rew_std": 1331.236, "Agent": "SAC"}, {"env_step": 450000, "rew": 3857.306, "rew_std": 1314.3741, "Agent": "SAC"}, {"env_step": 455000, "rew": 3739.2678, "rew_std": 1672.9652, "Agent": "SAC"}, {"env_step": 460000, "rew": 2776.1559, "rew_std": 1809.8104, "Agent": "SAC"}, {"env_step": 465000, "rew": 3620.809, "rew_std": 1596.7628, "Agent": "SAC"}, {"env_step": 470000, "rew": 3130.615, "rew_std": 1227.9251, "Agent": "SAC"}, {"env_step": 475000, "rew": 3261.6376, "rew_std": 1696.0082, "Agent": "SAC"}, {"env_step": 480000, "rew": 3720.7236, "rew_std": 1627.3018, "Agent": "SAC"}, {"env_step": 485000, "rew": 5117.4884, "rew_std": 345.2388, "Agent": "SAC"}, {"env_step": 490000, "rew": 4224.7134, "rew_std": 1283.841, "Agent": "SAC"}, {"env_step": 495000, "rew": 3923.3252, "rew_std": 1043.406, "Agent": "SAC"}, {"env_step": 500000, "rew": 3513.0907, "rew_std": 1830.6286, "Agent": "SAC"}, {"env_step": 505000, "rew": 4370.6183, "rew_std": 838.9721, "Agent": "SAC"}, {"env_step": 510000, "rew": 3937.4691, "rew_std": 1341.3907, "Agent": "SAC"}, {"env_step": 515000, "rew": 4388.9263, "rew_std": 1050.192, "Agent": "SAC"}, {"env_step": 520000, "rew": 4552.7993, "rew_std": 1075.7803, "Agent": "SAC"}, {"env_step": 525000, "rew": 3348.2774, "rew_std": 1406.7555, "Agent": "SAC"}, {"env_step": 530000, "rew": 3760.4822, "rew_std": 1752.8619, "Agent": "SAC"}, {"env_step": 535000, "rew": 3860.4773, "rew_std": 1670.5976, "Agent": "SAC"}, {"env_step": 540000, "rew": 4280.2371, "rew_std": 1125.5536, "Agent": "SAC"}, {"env_step": 545000, "rew": 4687.5066, "rew_std": 800.7659, "Agent": "SAC"}, {"env_step": 550000, "rew": 4513.5009, "rew_std": 960.5825, "Agent": "SAC"}, {"env_step": 555000, "rew": 4916.996, "rew_std": 1105.08, "Agent": "SAC"}, {"env_step": 560000, "rew": 3862.9368, "rew_std": 1644.8431, "Agent": "SAC"}, {"env_step": 565000, "rew": 4770.655, "rew_std": 881.5879, "Agent": "SAC"}, {"env_step": 570000, "rew": 4187.2924, "rew_std": 1616.1352, "Agent": "SAC"}, {"env_step": 575000, "rew": 4504.8732, "rew_std": 1389.8827, "Agent": "SAC"}, {"env_step": 580000, "rew": 4440.6944, "rew_std": 1185.3543, "Agent": "SAC"}, {"env_step": 585000, "rew": 4227.2634, "rew_std": 1261.4641, "Agent": "SAC"}, {"env_step": 590000, "rew": 4496.8565, "rew_std": 1100.5603, "Agent": "SAC"}, {"env_step": 595000, "rew": 4897.1523, "rew_std": 673.0572, "Agent": "SAC"}, {"env_step": 600000, "rew": 4824.998, "rew_std": 1298.6373, "Agent": "SAC"}, {"env_step": 605000, "rew": 4338.918, "rew_std": 1322.4879, "Agent": "SAC"}, {"env_step": 610000, "rew": 4937.4641, "rew_std": 694.7557, "Agent": "SAC"}, {"env_step": 615000, "rew": 5122.7475, "rew_std": 560.8034, "Agent": "SAC"}, {"env_step": 620000, "rew": 4848.3673, "rew_std": 1080.9785, "Agent": "SAC"}, {"env_step": 625000, "rew": 5232.965, "rew_std": 625.975, "Agent": "SAC"}, {"env_step": 630000, "rew": 5002.0817, "rew_std": 737.5698, "Agent": "SAC"}, {"env_step": 635000, "rew": 5374.9484, "rew_std": 216.2208, "Agent": "SAC"}, {"env_step": 640000, "rew": 5125.9609, "rew_std": 1028.8434, "Agent": "SAC"}, {"env_step": 645000, "rew": 4931.8062, "rew_std": 1508.0666, "Agent": "SAC"}, {"env_step": 650000, "rew": 4572.6578, "rew_std": 1386.8231, "Agent": "SAC"}, {"env_step": 655000, "rew": 4731.1344, "rew_std": 1108.9666, "Agent": "SAC"}, {"env_step": 660000, "rew": 4734.3651, "rew_std": 1294.0055, "Agent": "SAC"}, {"env_step": 665000, "rew": 4941.1906, "rew_std": 622.0798, "Agent": "SAC"}, {"env_step": 670000, "rew": 4804.5048, "rew_std": 890.0309, "Agent": "SAC"}, {"env_step": 675000, "rew": 4684.468, "rew_std": 821.0354, "Agent": "SAC"}, {"env_step": 680000, "rew": 5363.6274, "rew_std": 164.0225, "Agent": "SAC"}, {"env_step": 685000, "rew": 5001.633, "rew_std": 1051.6927, "Agent": "SAC"}, {"env_step": 690000, "rew": 5298.3275, "rew_std": 339.2928, "Agent": "SAC"}, {"env_step": 695000, "rew": 4865.5476, "rew_std": 1470.0991, "Agent": "SAC"}, {"env_step": 700000, "rew": 4609.8391, "rew_std": 1406.8704, "Agent": "SAC"}, {"env_step": 705000, "rew": 5323.9809, "rew_std": 306.6037, "Agent": "SAC"}, {"env_step": 710000, "rew": 5128.291, "rew_std": 443.2792, "Agent": "SAC"}, {"env_step": 715000, "rew": 5192.4866, "rew_std": 402.7956, "Agent": "SAC"}, {"env_step": 720000, "rew": 5305.8674, "rew_std": 212.3237, "Agent": "SAC"}, {"env_step": 725000, "rew": 4923.7567, "rew_std": 1082.2713, "Agent": "SAC"}, {"env_step": 730000, "rew": 4893.8484, "rew_std": 1127.4641, "Agent": "SAC"}, {"env_step": 735000, "rew": 5376.7686, "rew_std": 154.4458, "Agent": "SAC"}, {"env_step": 740000, "rew": 5129.1078, "rew_std": 422.2793, "Agent": "SAC"}, {"env_step": 745000, "rew": 5254.9446, "rew_std": 345.5945, "Agent": "SAC"}, {"env_step": 750000, "rew": 5201.6401, "rew_std": 529.1572, "Agent": "SAC"}, {"env_step": 755000, "rew": 5287.1598, "rew_std": 430.0224, "Agent": "SAC"}, {"env_step": 760000, "rew": 5188.2075, "rew_std": 406.3099, "Agent": "SAC"}, {"env_step": 765000, "rew": 5321.3263, "rew_std": 380.4228, "Agent": "SAC"}, {"env_step": 770000, "rew": 5150.8102, "rew_std": 472.9078, "Agent": "SAC"}, {"env_step": 775000, "rew": 5112.3058, "rew_std": 448.8352, "Agent": "SAC"}, {"env_step": 780000, "rew": 5438.7415, "rew_std": 139.0196, "Agent": "SAC"}, {"env_step": 785000, "rew": 5424.2751, "rew_std": 219.4044, "Agent": "SAC"}, {"env_step": 790000, "rew": 5420.4271, "rew_std": 170.9598, "Agent": "SAC"}, {"env_step": 795000, "rew": 5409.7089, "rew_std": 152.7513, "Agent": "SAC"}, {"env_step": 800000, "rew": 5369.1825, "rew_std": 271.0678, "Agent": "SAC"}, {"env_step": 805000, "rew": 5061.0436, "rew_std": 772.6225, "Agent": "SAC"}, {"env_step": 810000, "rew": 4937.3571, "rew_std": 1475.3603, "Agent": "SAC"}, {"env_step": 815000, "rew": 4996.5811, "rew_std": 1230.9226, "Agent": "SAC"}, {"env_step": 820000, "rew": 5018.8375, "rew_std": 786.6848, "Agent": "SAC"}, {"env_step": 825000, "rew": 5130.769, "rew_std": 610.5639, "Agent": "SAC"}, {"env_step": 830000, "rew": 5208.4764, "rew_std": 526.7289, "Agent": "SAC"}, {"env_step": 835000, "rew": 5122.3821, "rew_std": 995.9235, "Agent": "SAC"}, {"env_step": 840000, "rew": 5104.1109, "rew_std": 827.8651, "Agent": "SAC"}, {"env_step": 845000, "rew": 5429.061, "rew_std": 141.7453, "Agent": "SAC"}, {"env_step": 850000, "rew": 5427.7533, "rew_std": 187.8448, "Agent": "SAC"}, {"env_step": 855000, "rew": 5487.2295, "rew_std": 65.2655, "Agent": "SAC"}, {"env_step": 860000, "rew": 5392.2913, "rew_std": 200.2466, "Agent": "SAC"}, {"env_step": 865000, "rew": 5458.626, "rew_std": 116.5534, "Agent": "SAC"}, {"env_step": 870000, "rew": 5341.482, "rew_std": 513.9814, "Agent": "SAC"}, {"env_step": 875000, "rew": 5148.9941, "rew_std": 933.1094, "Agent": "SAC"}, {"env_step": 880000, "rew": 5302.6708, "rew_std": 569.9856, "Agent": "SAC"}, {"env_step": 885000, "rew": 5309.8879, "rew_std": 352.142, "Agent": "SAC"}, {"env_step": 890000, "rew": 5392.5359, "rew_std": 305.3011, "Agent": "SAC"}, {"env_step": 895000, "rew": 5182.5145, "rew_std": 779.8814, "Agent": "SAC"}, {"env_step": 900000, "rew": 4960.3537, "rew_std": 1161.7267, "Agent": "SAC"}, {"env_step": 905000, "rew": 4939.2962, "rew_std": 1498.3747, "Agent": "SAC"}, {"env_step": 910000, "rew": 4885.5797, "rew_std": 1316.2522, "Agent": "SAC"}, {"env_step": 915000, "rew": 5341.225, "rew_std": 407.8162, "Agent": "SAC"}, {"env_step": 920000, "rew": 5306.9093, "rew_std": 475.8455, "Agent": "SAC"}, {"env_step": 925000, "rew": 5105.3437, "rew_std": 579.3931, "Agent": "SAC"}, {"env_step": 930000, "rew": 5402.4238, "rew_std": 152.8403, "Agent": "SAC"}, {"env_step": 935000, "rew": 5371.9716, "rew_std": 303.9729, "Agent": "SAC"}, {"env_step": 940000, "rew": 4486.8878, "rew_std": 1637.3413, "Agent": "SAC"}, {"env_step": 945000, "rew": 4823.5619, "rew_std": 1488.3126, "Agent": "SAC"}, {"env_step": 950000, "rew": 4822.0419, "rew_std": 1248.3136, "Agent": "SAC"}, {"env_step": 955000, "rew": 5447.5403, "rew_std": 165.6376, "Agent": "SAC"}, {"env_step": 960000, "rew": 5380.7014, "rew_std": 231.9971, "Agent": "SAC"}, {"env_step": 965000, "rew": 4889.1171, "rew_std": 894.6478, "Agent": "SAC"}, {"env_step": 970000, "rew": 5488.5109, "rew_std": 81.1671, "Agent": "SAC"}, {"env_step": 975000, "rew": 5480.2766, "rew_std": 153.2717, "Agent": "SAC"}, {"env_step": 980000, "rew": 5278.1923, "rew_std": 386.9493, "Agent": "SAC"}, {"env_step": 985000, "rew": 4943.0578, "rew_std": 1237.4507, "Agent": "SAC"}, {"env_step": 990000, "rew": 5409.148, "rew_std": 380.3438, "Agent": "SAC"}, {"env_step": 995000, "rew": 5483.5326, "rew_std": 103.0683, "Agent": "SAC"}, {"env_step": 1000000, "rew": 5415.5553, "rew_std": 214.0002, "Agent": "SAC"}, {"env_step": 1005000, "rew": 4959.1109, "rew_std": 1027.8864, "Agent": "SAC"}, {"env_step": 1010000, "rew": 5287.968, "rew_std": 535.2375, "Agent": "SAC"}, {"env_step": 1015000, "rew": 5500.3241, "rew_std": 233.4036, "Agent": "SAC"}, {"env_step": 1020000, "rew": 5212.1734, "rew_std": 952.0981, "Agent": "SAC"}, {"env_step": 1025000, "rew": 4906.8683, "rew_std": 966.5824, "Agent": "SAC"}, {"env_step": 1030000, "rew": 5261.8926, "rew_std": 551.9458, "Agent": "SAC"}, {"env_step": 1035000, "rew": 4983.7048, "rew_std": 1141.9197, "Agent": "SAC"}, {"env_step": 1040000, "rew": 5295.4149, "rew_std": 447.8563, "Agent": "SAC"}, {"env_step": 1045000, "rew": 4679.6166, "rew_std": 1609.6388, "Agent": "SAC"}, {"env_step": 1050000, "rew": 4691.6723, "rew_std": 1552.6393, "Agent": "SAC"}, {"env_step": 1055000, "rew": 5203.9302, "rew_std": 994.1317, "Agent": "SAC"}, {"env_step": 1060000, "rew": 5220.7184, "rew_std": 593.7466, "Agent": "SAC"}, {"env_step": 1065000, "rew": 5501.3539, "rew_std": 181.2919, "Agent": "SAC"}, {"env_step": 1070000, "rew": 5522.3152, "rew_std": 170.9723, "Agent": "SAC"}, {"env_step": 1075000, "rew": 5227.2177, "rew_std": 999.9346, "Agent": "SAC"}, {"env_step": 1080000, "rew": 5061.4714, "rew_std": 846.1303, "Agent": "SAC"}, {"env_step": 1085000, "rew": 5546.8159, "rew_std": 84.1642, "Agent": "SAC"}, {"env_step": 1090000, "rew": 5231.8019, "rew_std": 575.674, "Agent": "SAC"}, {"env_step": 1095000, "rew": 5367.6769, "rew_std": 420.0235, "Agent": "SAC"}, {"env_step": 1100000, "rew": 5506.1081, "rew_std": 179.8471, "Agent": "SAC"}, {"env_step": 1105000, "rew": 5601.4685, "rew_std": 68.1431, "Agent": "SAC"}, {"env_step": 1110000, "rew": 5408.7534, "rew_std": 325.9523, "Agent": "SAC"}, {"env_step": 1115000, "rew": 5535.2153, "rew_std": 186.8377, "Agent": "SAC"}, {"env_step": 1120000, "rew": 5532.6407, "rew_std": 205.192, "Agent": "SAC"}, {"env_step": 1125000, "rew": 5552.3668, "rew_std": 77.1201, "Agent": "SAC"}, {"env_step": 1130000, "rew": 5129.3217, "rew_std": 1263.6823, "Agent": "SAC"}, {"env_step": 1135000, "rew": 5500.5953, "rew_std": 187.8342, "Agent": "SAC"}, {"env_step": 1140000, "rew": 5503.6788, "rew_std": 275.1286, "Agent": "SAC"}, {"env_step": 1145000, "rew": 4995.5923, "rew_std": 1255.58, "Agent": "SAC"}, {"env_step": 1150000, "rew": 5248.8098, "rew_std": 751.2548, "Agent": "SAC"}, {"env_step": 1155000, "rew": 5435.8424, "rew_std": 209.4219, "Agent": "SAC"}, {"env_step": 1160000, "rew": 5527.5078, "rew_std": 200.7482, "Agent": "SAC"}, {"env_step": 1165000, "rew": 5550.173, "rew_std": 65.9799, "Agent": "SAC"}, {"env_step": 1170000, "rew": 5443.7728, "rew_std": 418.8417, "Agent": "SAC"}, {"env_step": 1175000, "rew": 5464.0429, "rew_std": 348.5082, "Agent": "SAC"}, {"env_step": 1180000, "rew": 5568.4337, "rew_std": 82.9834, "Agent": "SAC"}, {"env_step": 1185000, "rew": 5524.763, "rew_std": 171.4394, "Agent": "SAC"}, {"env_step": 1190000, "rew": 5212.8234, "rew_std": 1062.9118, "Agent": "SAC"}, {"env_step": 1195000, "rew": 5102.0455, "rew_std": 1028.9742, "Agent": "SAC"}, {"env_step": 1200000, "rew": 5481.4111, "rew_std": 230.1548, "Agent": "SAC"}, {"env_step": 1205000, "rew": 4889.8177, "rew_std": 1342.0486, "Agent": "SAC"}, {"env_step": 1210000, "rew": 5501.9494, "rew_std": 315.0388, "Agent": "SAC"}, {"env_step": 1215000, "rew": 5507.2537, "rew_std": 196.4056, "Agent": "SAC"}, {"env_step": 1220000, "rew": 5481.4773, "rew_std": 304.5546, "Agent": "SAC"}, {"env_step": 1225000, "rew": 5331.5667, "rew_std": 802.8777, "Agent": "SAC"}, {"env_step": 1230000, "rew": 5621.8863, "rew_std": 65.417, "Agent": "SAC"}, {"env_step": 1235000, "rew": 5310.1082, "rew_std": 560.1617, "Agent": "SAC"}, {"env_step": 1240000, "rew": 5518.8848, "rew_std": 221.8269, "Agent": "SAC"}, {"env_step": 1245000, "rew": 5296.2923, "rew_std": 998.7259, "Agent": "SAC"}, {"env_step": 1250000, "rew": 5378.8669, "rew_std": 392.2601, "Agent": "SAC"}, {"env_step": 0, "rew": 130.7126, "rew_std": 15.6136, "Agent": "TRPO"}, {"env_step": 30720, "rew": 226.8736, "rew_std": 12.392, "Agent": "TRPO"}, {"env_step": 61440, "rew": 349.9484, "rew_std": 34.8935, "Agent": "TRPO"}, {"env_step": 92160, "rew": 415.3155, "rew_std": 33.0504, "Agent": "TRPO"}, {"env_step": 122880, "rew": 438.3635, "rew_std": 39.9775, "Agent": "TRPO"}, {"env_step": 153600, "rew": 451.6102, "rew_std": 34.5927, "Agent": "TRPO"}, {"env_step": 184320, "rew": 482.4092, "rew_std": 34.5978, "Agent": "TRPO"}, {"env_step": 215040, "rew": 489.3611, "rew_std": 25.8785, "Agent": "TRPO"}, {"env_step": 245760, "rew": 497.038, "rew_std": 47.2623, "Agent": "TRPO"}, {"env_step": 276480, "rew": 515.3574, "rew_std": 38.2701, "Agent": "TRPO"}, {"env_step": 307200, "rew": 533.849, "rew_std": 40.7011, "Agent": "TRPO"}, {"env_step": 337920, "rew": 540.9039, "rew_std": 47.8602, "Agent": "TRPO"}, {"env_step": 368640, "rew": 533.3149, "rew_std": 39.9207, "Agent": "TRPO"}, {"env_step": 399360, "rew": 535.4808, "rew_std": 39.5439, "Agent": "TRPO"}, {"env_step": 430080, "rew": 551.0049, "rew_std": 62.1324, "Agent": "TRPO"}, {"env_step": 460800, "rew": 549.1813, "rew_std": 33.9869, "Agent": "TRPO"}, {"env_step": 491520, "rew": 573.173, "rew_std": 34.2006, "Agent": "TRPO"}, {"env_step": 522240, "rew": 551.7235, "rew_std": 26.4329, "Agent": "TRPO"}, {"env_step": 552960, "rew": 600.2877, "rew_std": 41.1054, "Agent": "TRPO"}, {"env_step": 583680, "rew": 588.1711, "rew_std": 62.2999, "Agent": "TRPO"}, {"env_step": 614400, "rew": 598.293, "rew_std": 32.4528, "Agent": "TRPO"}, {"env_step": 645120, "rew": 639.6377, "rew_std": 52.8143, "Agent": "TRPO"}, {"env_step": 675840, "rew": 624.9327, "rew_std": 46.1414, "Agent": "TRPO"}, {"env_step": 706560, "rew": 632.0389, "rew_std": 50.6505, "Agent": "TRPO"}, {"env_step": 737280, "rew": 653.4298, "rew_std": 47.047, "Agent": "TRPO"}, {"env_step": 768000, "rew": 678.1306, "rew_std": 76.9806, "Agent": "TRPO"}, {"env_step": 798720, "rew": 688.6861, "rew_std": 84.0171, "Agent": "TRPO"}, {"env_step": 829440, "rew": 709.0345, "rew_std": 116.5584, "Agent": "TRPO"}, {"env_step": 860160, "rew": 698.1775, "rew_std": 47.4192, "Agent": "TRPO"}, {"env_step": 890880, "rew": 788.5274, "rew_std": 151.7209, "Agent": "TRPO"}, {"env_step": 921600, "rew": 735.9283, "rew_std": 94.4404, "Agent": "TRPO"}, {"env_step": 952320, "rew": 794.3346, "rew_std": 120.8067, "Agent": "TRPO"}, {"env_step": 983040, "rew": 810.0602, "rew_std": 126.1111, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 798.5407, "rew_std": 145.3247, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 871.2716, "rew_std": 241.1752, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 848.4981, "rew_std": 150.7763, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 913.738, "rew_std": 164.1103, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 958.4103, "rew_std": 174.4827, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 1060.269, "rew_std": 252.2171, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 978.3352, "rew_std": 253.0927, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 1007.6961, "rew_std": 272.0871, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 1142.1278, "rew_std": 293.5601, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 1179.4149, "rew_std": 276.1729, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 1289.5336, "rew_std": 443.125, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 1352.0565, "rew_std": 500.1908, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 1580.4102, "rew_std": 600.5368, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 1648.1469, "rew_std": 629.6008, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 1613.4132, "rew_std": 652.2997, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 1656.0897, "rew_std": 514.4549, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 1670.3156, "rew_std": 615.8045, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 1998.4139, "rew_std": 828.7502, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 1855.801, "rew_std": 785.2249, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 2032.4979, "rew_std": 825.8749, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 2209.814, "rew_std": 862.7375, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 2214.2652, "rew_std": 832.3896, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 2301.5468, "rew_std": 973.7445, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 2325.3191, "rew_std": 601.7854, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 2545.681, "rew_std": 857.882, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 2493.511, "rew_std": 929.6768, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 2382.4376, "rew_std": 841.1032, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 2967.9437, "rew_std": 1054.8878, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 2712.3964, "rew_std": 808.9423, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 2863.5728, "rew_std": 1074.1575, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 3396.4443, "rew_std": 1173.8096, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 3366.6014, "rew_std": 935.0809, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 3424.3939, "rew_std": 977.0058, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 3418.3379, "rew_std": 713.7476, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 3193.769, "rew_std": 983.3857, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 3764.1014, "rew_std": 997.041, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 3324.6148, "rew_std": 1049.9666, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 3744.067, "rew_std": 1091.1226, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 3916.1158, "rew_std": 539.2794, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 3953.745, "rew_std": 688.9312, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 4246.9708, "rew_std": 569.9072, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 3852.2697, "rew_std": 755.746, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 4055.375, "rew_std": 790.9762, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 4214.089, "rew_std": 861.1226, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 4291.6303, "rew_std": 575.5174, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 4118.7938, "rew_std": 576.8646, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 4372.9623, "rew_std": 365.566, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 4423.0516, "rew_std": 598.6857, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 4534.2491, "rew_std": 851.5078, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 4866.6011, "rew_std": 663.749, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 4615.6011, "rew_std": 661.0308, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 4413.3694, "rew_std": 454.5142, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 4739.428, "rew_std": 466.3908, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 4782.8166, "rew_std": 596.5892, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 5095.0046, "rew_std": 553.9764, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 4854.7521, "rew_std": 550.9194, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 4305.3093, "rew_std": 583.5533, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 4799.1434, "rew_std": 495.221, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 4692.5081, "rew_std": 647.1961, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 4610.8764, "rew_std": 651.0562, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 4856.4497, "rew_std": 779.8863, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 4974.5723, "rew_std": 568.98, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 4847.5896, "rew_std": 528.4401, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 5154.396, "rew_std": 594.126, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 4712.9747, "rew_std": 616.0265, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 4646.6107, "rew_std": 705.5114, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 4992.6209, "rew_std": 443.3291, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 4956.3584, "rew_std": 673.7065, "Agent": "TRPO"}, {"env_step": 0, "rew": 130.7126, "rew_std": 15.6136, "Agent": "A2C"}, {"env_step": 30000, "rew": 353.9919, "rew_std": 44.5764, "Agent": "A2C"}, {"env_step": 60000, "rew": 383.1186, "rew_std": 37.3552, "Agent": "A2C"}, {"env_step": 90000, "rew": 426.6209, "rew_std": 35.6024, "Agent": "A2C"}, {"env_step": 120000, "rew": 430.859, "rew_std": 44.2118, "Agent": "A2C"}, {"env_step": 150000, "rew": 467.4777, "rew_std": 41.7401, "Agent": "A2C"}, {"env_step": 180000, "rew": 520.8538, "rew_std": 68.7925, "Agent": "A2C"}, {"env_step": 210000, "rew": 500.8319, "rew_std": 83.603, "Agent": "A2C"}, {"env_step": 240000, "rew": 496.1667, "rew_std": 39.6322, "Agent": "A2C"}, {"env_step": 270000, "rew": 531.1016, "rew_std": 50.328, "Agent": "A2C"}, {"env_step": 300000, "rew": 536.9946, "rew_std": 36.1136, "Agent": "A2C"}, {"env_step": 330000, "rew": 528.5104, "rew_std": 50.3768, "Agent": "A2C"}, {"env_step": 360000, "rew": 559.3917, "rew_std": 45.3429, "Agent": "A2C"}, {"env_step": 390000, "rew": 525.345, "rew_std": 56.0154, "Agent": "A2C"}, {"env_step": 420000, "rew": 549.3972, "rew_std": 47.0919, "Agent": "A2C"}, {"env_step": 450000, "rew": 551.0984, "rew_std": 50.0343, "Agent": "A2C"}, {"env_step": 480000, "rew": 562.8467, "rew_std": 37.7813, "Agent": "A2C"}, {"env_step": 510000, "rew": 554.9192, "rew_std": 37.7401, "Agent": "A2C"}, {"env_step": 540000, "rew": 613.7179, "rew_std": 109.5216, "Agent": "A2C"}, {"env_step": 570000, "rew": 614.4935, "rew_std": 92.6857, "Agent": "A2C"}, {"env_step": 600000, "rew": 613.4367, "rew_std": 105.5949, "Agent": "A2C"}, {"env_step": 630000, "rew": 671.3968, "rew_std": 117.3872, "Agent": "A2C"}, {"env_step": 660000, "rew": 635.6361, "rew_std": 118.8407, "Agent": "A2C"}, {"env_step": 690000, "rew": 706.9048, "rew_std": 174.3268, "Agent": "A2C"}, {"env_step": 720000, "rew": 855.8826, "rew_std": 337.6497, "Agent": "A2C"}, {"env_step": 750000, "rew": 1007.2058, "rew_std": 564.3479, "Agent": "A2C"}, {"env_step": 780000, "rew": 1003.8926, "rew_std": 625.1997, "Agent": "A2C"}, {"env_step": 810000, "rew": 1359.2944, "rew_std": 909.4713, "Agent": "A2C"}, {"env_step": 840000, "rew": 1214.6042, "rew_std": 851.1437, "Agent": "A2C"}, {"env_step": 870000, "rew": 1349.1214, "rew_std": 731.7768, "Agent": "A2C"}, {"env_step": 900000, "rew": 1412.6869, "rew_std": 851.1827, "Agent": "A2C"}, {"env_step": 930000, "rew": 1726.0036, "rew_std": 1070.0676, "Agent": "A2C"}, {"env_step": 960000, "rew": 1331.9998, "rew_std": 718.4679, "Agent": "A2C"}, {"env_step": 990000, "rew": 1765.9037, "rew_std": 1235.2031, "Agent": "A2C"}, {"env_step": 1020000, "rew": 2476.1129, "rew_std": 1305.1744, "Agent": "A2C"}, {"env_step": 1050000, "rew": 2258.8718, "rew_std": 1242.0474, "Agent": "A2C"}, {"env_step": 1080000, "rew": 2349.4063, "rew_std": 1315.8576, "Agent": "A2C"}, {"env_step": 1110000, "rew": 2802.3667, "rew_std": 1370.2395, "Agent": "A2C"}, {"env_step": 1140000, "rew": 2604.3733, "rew_std": 1407.5554, "Agent": "A2C"}, {"env_step": 1170000, "rew": 2812.3223, "rew_std": 1597.652, "Agent": "A2C"}, {"env_step": 1200000, "rew": 2826.2653, "rew_std": 1363.381, "Agent": "A2C"}, {"env_step": 1230000, "rew": 2606.3455, "rew_std": 1404.4811, "Agent": "A2C"}, {"env_step": 1260000, "rew": 3003.1294, "rew_std": 1444.6226, "Agent": "A2C"}, {"env_step": 1290000, "rew": 2607.4257, "rew_std": 1319.1591, "Agent": "A2C"}, {"env_step": 1320000, "rew": 3091.2105, "rew_std": 1413.2513, "Agent": "A2C"}, {"env_step": 1350000, "rew": 3144.1315, "rew_std": 1492.1207, "Agent": "A2C"}, {"env_step": 1380000, "rew": 3326.8287, "rew_std": 1568.8489, "Agent": "A2C"}, {"env_step": 1410000, "rew": 3587.6421, "rew_std": 1439.4819, "Agent": "A2C"}, {"env_step": 1440000, "rew": 2980.8724, "rew_std": 1454.9531, "Agent": "A2C"}, {"env_step": 1470000, "rew": 3583.043, "rew_std": 1493.8679, "Agent": "A2C"}, {"env_step": 1500000, "rew": 3462.9114, "rew_std": 1451.1828, "Agent": "A2C"}, {"env_step": 1530000, "rew": 3472.9946, "rew_std": 1540.7852, "Agent": "A2C"}, {"env_step": 1560000, "rew": 2653.2359, "rew_std": 1141.8654, "Agent": "A2C"}, {"env_step": 1590000, "rew": 3698.7924, "rew_std": 1472.0893, "Agent": "A2C"}, {"env_step": 1620000, "rew": 3369.2388, "rew_std": 1185.2593, "Agent": "A2C"}, {"env_step": 1650000, "rew": 3751.0162, "rew_std": 1372.8344, "Agent": "A2C"}, {"env_step": 1680000, "rew": 3460.9345, "rew_std": 1359.9235, "Agent": "A2C"}, {"env_step": 1710000, "rew": 4017.4043, "rew_std": 1516.6362, "Agent": "A2C"}, {"env_step": 1740000, "rew": 3841.3238, "rew_std": 1169.35, "Agent": "A2C"}, {"env_step": 1770000, "rew": 4317.4256, "rew_std": 1351.0404, "Agent": "A2C"}, {"env_step": 1800000, "rew": 3615.3238, "rew_std": 1324.6659, "Agent": "A2C"}, {"env_step": 1830000, "rew": 3990.3708, "rew_std": 1115.5551, "Agent": "A2C"}, {"env_step": 1860000, "rew": 4051.3542, "rew_std": 999.8893, "Agent": "A2C"}, {"env_step": 1890000, "rew": 4374.4812, "rew_std": 1537.1536, "Agent": "A2C"}, {"env_step": 1920000, "rew": 4263.77, "rew_std": 1002.1095, "Agent": "A2C"}, {"env_step": 1950000, "rew": 4083.6131, "rew_std": 1265.3289, "Agent": "A2C"}, {"env_step": 1980000, "rew": 4533.5691, "rew_std": 903.9607, "Agent": "A2C"}, {"env_step": 2010000, "rew": 4359.9509, "rew_std": 1059.9943, "Agent": "A2C"}, {"env_step": 2040000, "rew": 4260.8664, "rew_std": 1053.3046, "Agent": "A2C"}, {"env_step": 2070000, "rew": 3934.3529, "rew_std": 1003.8132, "Agent": "A2C"}, {"env_step": 2100000, "rew": 4516.3735, "rew_std": 679.4857, "Agent": "A2C"}, {"env_step": 2130000, "rew": 4899.1379, "rew_std": 650.4817, "Agent": "A2C"}, {"env_step": 2160000, "rew": 4413.6033, "rew_std": 580.1522, "Agent": "A2C"}, {"env_step": 2190000, "rew": 4688.5056, "rew_std": 570.3642, "Agent": "A2C"}, {"env_step": 2220000, "rew": 4468.6075, "rew_std": 710.3848, "Agent": "A2C"}, {"env_step": 2250000, "rew": 4835.1334, "rew_std": 760.7642, "Agent": "A2C"}, {"env_step": 2280000, "rew": 4374.0217, "rew_std": 776.1664, "Agent": "A2C"}, {"env_step": 2310000, "rew": 4442.3485, "rew_std": 710.9176, "Agent": "A2C"}, {"env_step": 2340000, "rew": 4771.5979, "rew_std": 737.0396, "Agent": "A2C"}, {"env_step": 2370000, "rew": 4354.7658, "rew_std": 719.8449, "Agent": "A2C"}, {"env_step": 2400000, "rew": 4510.2853, "rew_std": 732.1358, "Agent": "A2C"}, {"env_step": 2430000, "rew": 4661.3797, "rew_std": 887.0676, "Agent": "A2C"}, {"env_step": 2460000, "rew": 4849.6007, "rew_std": 729.8122, "Agent": "A2C"}, {"env_step": 2490000, "rew": 4860.8034, "rew_std": 752.8378, "Agent": "A2C"}, {"env_step": 2520000, "rew": 5118.544, "rew_std": 512.6474, "Agent": "A2C"}, {"env_step": 2550000, "rew": 5234.9514, "rew_std": 749.6186, "Agent": "A2C"}, {"env_step": 2580000, "rew": 5014.9994, "rew_std": 851.1116, "Agent": "A2C"}, {"env_step": 2610000, "rew": 4910.4339, "rew_std": 593.0186, "Agent": "A2C"}, {"env_step": 2640000, "rew": 5285.795, "rew_std": 588.8437, "Agent": "A2C"}, {"env_step": 2670000, "rew": 5061.3064, "rew_std": 570.5551, "Agent": "A2C"}, {"env_step": 2700000, "rew": 5231.117, "rew_std": 574.5865, "Agent": "A2C"}, {"env_step": 2730000, "rew": 5001.9283, "rew_std": 701.5343, "Agent": "A2C"}, {"env_step": 2760000, "rew": 4992.397, "rew_std": 500.2804, "Agent": "A2C"}, {"env_step": 2790000, "rew": 5147.4111, "rew_std": 510.2497, "Agent": "A2C"}, {"env_step": 2820000, "rew": 4734.8069, "rew_std": 661.113, "Agent": "A2C"}, {"env_step": 2850000, "rew": 5067.7192, "rew_std": 581.2196, "Agent": "A2C"}, {"env_step": 2880000, "rew": 5300.8283, "rew_std": 668.5736, "Agent": "A2C"}, {"env_step": 2910000, "rew": 5316.5694, "rew_std": 554.7586, "Agent": "A2C"}, {"env_step": 2940000, "rew": 5112.4173, "rew_std": 489.4034, "Agent": "A2C"}, {"env_step": 2970000, "rew": 4819.7192, "rew_std": 603.6194, "Agent": "A2C"}, {"env_step": 3000000, "rew": 5138.2266, "rew_std": 458.5997, "Agent": "A2C"}, {"env_step": 0, "rew": 130.2371, "rew_std": 14.6922, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 138.8216, "rew_std": 11.4886, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 164.9226, "rew_std": 19.4707, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 198.3888, "rew_std": 37.2572, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 237.1055, "rew_std": 31.6248, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 271.4301, "rew_std": 43.5939, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 302.5788, "rew_std": 47.0946, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 316.7206, "rew_std": 43.713, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 324.2093, "rew_std": 32.2148, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 334.9953, "rew_std": 29.1609, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 327.3075, "rew_std": 26.6873, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 321.1282, "rew_std": 36.9124, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 361.2524, "rew_std": 38.5395, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 325.8244, "rew_std": 29.4945, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 336.9366, "rew_std": 34.1756, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 354.6768, "rew_std": 37.1133, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 336.1224, "rew_std": 27.6541, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 349.5337, "rew_std": 42.9355, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 361.132, "rew_std": 39.6285, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 330.1614, "rew_std": 29.2725, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 351.1658, "rew_std": 27.9394, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 343.2164, "rew_std": 37.2824, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 345.9966, "rew_std": 52.9727, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 339.2842, "rew_std": 38.5878, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 337.1782, "rew_std": 38.0244, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 320.0956, "rew_std": 19.8551, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 332.5159, "rew_std": 38.2012, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 329.8925, "rew_std": 40.5504, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 327.9263, "rew_std": 33.703, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 329.9293, "rew_std": 33.4927, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 328.2912, "rew_std": 26.8944, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 327.0103, "rew_std": 31.5154, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 339.9061, "rew_std": 28.7103, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 338.6159, "rew_std": 19.0502, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 330.5302, "rew_std": 34.3422, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 336.1799, "rew_std": 31.2653, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 331.4958, "rew_std": 33.5308, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 344.1079, "rew_std": 38.1431, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 327.4818, "rew_std": 29.5658, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 346.0026, "rew_std": 35.9292, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 340.0773, "rew_std": 36.9668, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 345.92, "rew_std": 24.8816, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 341.0296, "rew_std": 34.6181, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 338.4484, "rew_std": 29.8942, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 350.9085, "rew_std": 43.6155, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 336.2607, "rew_std": 32.7689, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 331.7369, "rew_std": 30.269, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 338.2156, "rew_std": 31.0497, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 327.8085, "rew_std": 23.7205, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 333.4152, "rew_std": 21.6442, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 324.8708, "rew_std": 30.9509, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 322.9822, "rew_std": 39.133, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 332.5282, "rew_std": 42.846, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 324.8569, "rew_std": 25.8733, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 335.496, "rew_std": 40.2427, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 327.3037, "rew_std": 36.256, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 331.141, "rew_std": 37.3948, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 312.7652, "rew_std": 21.8551, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 328.4288, "rew_std": 38.836, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 323.7323, "rew_std": 32.5279, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 324.9909, "rew_std": 28.8213, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 328.8011, "rew_std": 27.6594, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 337.1219, "rew_std": 36.6454, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 323.6468, "rew_std": 23.7499, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 336.0521, "rew_std": 28.4636, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 316.9374, "rew_std": 33.764, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 324.809, "rew_std": 16.3125, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 331.756, "rew_std": 35.7746, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 331.8604, "rew_std": 31.4516, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 333.4709, "rew_std": 37.8808, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 327.8076, "rew_std": 29.9532, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 330.1836, "rew_std": 29.7042, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 340.5726, "rew_std": 22.8185, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 332.1629, "rew_std": 36.0735, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 323.4985, "rew_std": 28.3859, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 341.7284, "rew_std": 33.9916, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 329.6508, "rew_std": 24.4636, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 325.7434, "rew_std": 25.8358, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 329.8479, "rew_std": 29.5135, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 320.347, "rew_std": 26.9729, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 336.0676, "rew_std": 23.3404, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 332.4239, "rew_std": 31.2853, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 337.8918, "rew_std": 32.1914, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 318.3681, "rew_std": 23.8972, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 327.5128, "rew_std": 22.2842, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 324.0976, "rew_std": 20.1685, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 328.825, "rew_std": 35.4503, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 345.4419, "rew_std": 33.8137, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 334.3103, "rew_std": 26.3187, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 326.1392, "rew_std": 33.8469, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 331.0169, "rew_std": 25.8849, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 342.7292, "rew_std": 38.3722, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 321.6434, "rew_std": 27.5761, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 335.2755, "rew_std": 36.7107, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 341.6504, "rew_std": 29.8181, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 326.5556, "rew_std": 32.4602, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 330.6679, "rew_std": 28.896, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 345.8178, "rew_std": 28.9973, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 337.5051, "rew_std": 34.4284, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 350.4975, "rew_std": 37.2138, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 342.4223, "rew_std": 34.963, "Agent": "ACKTR"}, {"env_step": 0, "rew": 177.3211, "rew_std": 77.5947, "Agent": "DDPG"}, {"env_step": 5000, "rew": 107.4722, "rew_std": 49.5394, "Agent": "DDPG"}, {"env_step": 10000, "rew": 107.419, "rew_std": 48.3793, "Agent": "DDPG"}, {"env_step": 15000, "rew": 107.8837, "rew_std": 48.1536, "Agent": "DDPG"}, {"env_step": 20000, "rew": 108.3848, "rew_std": 49.3729, "Agent": "DDPG"}, {"env_step": 25000, "rew": 109.1298, "rew_std": 50.4306, "Agent": "DDPG"}, {"env_step": 30000, "rew": 107.7117, "rew_std": 48.689, "Agent": "DDPG"}, {"env_step": 35000, "rew": 108.4788, "rew_std": 50.029, "Agent": "DDPG"}, {"env_step": 40000, "rew": 106.8252, "rew_std": 47.411, "Agent": "DDPG"}, {"env_step": 45000, "rew": 107.2152, "rew_std": 49.5615, "Agent": "DDPG"}, {"env_step": 50000, "rew": 108.1668, "rew_std": 49.1587, "Agent": "DDPG"}, {"env_step": 55000, "rew": 107.585, "rew_std": 48.4752, "Agent": "DDPG"}, {"env_step": 60000, "rew": 107.9617, "rew_std": 48.7848, "Agent": "DDPG"}, {"env_step": 65000, "rew": 108.5746, "rew_std": 49.0814, "Agent": "DDPG"}, {"env_step": 70000, "rew": 108.5917, "rew_std": 49.2006, "Agent": "DDPG"}, {"env_step": 75000, "rew": 108.2389, "rew_std": 48.5646, "Agent": "DDPG"}, {"env_step": 80000, "rew": 106.9407, "rew_std": 47.9692, "Agent": "DDPG"}, {"env_step": 85000, "rew": 107.1787, "rew_std": 48.6623, "Agent": "DDPG"}, {"env_step": 90000, "rew": 108.0858, "rew_std": 49.8083, "Agent": "DDPG"}, {"env_step": 95000, "rew": 107.9608, "rew_std": 49.5357, "Agent": "DDPG"}, {"env_step": 100000, "rew": 107.8685, "rew_std": 49.102, "Agent": "DDPG"}, {"env_step": 105000, "rew": 108.3229, "rew_std": 49.2733, "Agent": "DDPG"}, {"env_step": 110000, "rew": 108.9463, "rew_std": 49.2226, "Agent": "DDPG"}, {"env_step": 115000, "rew": 108.6805, "rew_std": 49.843, "Agent": "DDPG"}, {"env_step": 120000, "rew": 107.3607, "rew_std": 48.9263, "Agent": "DDPG"}, {"env_step": 125000, "rew": 109.0114, "rew_std": 50.1977, "Agent": "DDPG"}, {"env_step": 130000, "rew": 108.7159, "rew_std": 50.2207, "Agent": "DDPG"}, {"env_step": 135000, "rew": 107.8893, "rew_std": 49.0612, "Agent": "DDPG"}, {"env_step": 140000, "rew": 109.5944, "rew_std": 51.1663, "Agent": "DDPG"}, {"env_step": 145000, "rew": 109.2089, "rew_std": 50.4391, "Agent": "DDPG"}, {"env_step": 150000, "rew": 108.8583, "rew_std": 49.8412, "Agent": "DDPG"}, {"env_step": 155000, "rew": 108.5092, "rew_std": 49.0027, "Agent": "DDPG"}, {"env_step": 160000, "rew": 107.0541, "rew_std": 47.7677, "Agent": "DDPG"}, {"env_step": 165000, "rew": 108.3194, "rew_std": 49.2564, "Agent": "DDPG"}, {"env_step": 170000, "rew": 108.7133, "rew_std": 50.4113, "Agent": "DDPG"}, {"env_step": 175000, "rew": 108.8514, "rew_std": 50.5438, "Agent": "DDPG"}, {"env_step": 180000, "rew": 108.6988, "rew_std": 49.5952, "Agent": "DDPG"}, {"env_step": 185000, "rew": 107.0648, "rew_std": 47.8116, "Agent": "DDPG"}, {"env_step": 190000, "rew": 107.8391, "rew_std": 48.4472, "Agent": "DDPG"}, {"env_step": 195000, "rew": 108.5129, "rew_std": 49.9494, "Agent": "DDPG"}, {"env_step": 200000, "rew": 108.1958, "rew_std": 50.1158, "Agent": "DDPG"}, {"env_step": 205000, "rew": 108.3988, "rew_std": 49.3048, "Agent": "DDPG"}, {"env_step": 210000, "rew": 107.4057, "rew_std": 48.2847, "Agent": "DDPG"}, {"env_step": 215000, "rew": 107.1662, "rew_std": 48.5738, "Agent": "DDPG"}, {"env_step": 220000, "rew": 108.6186, "rew_std": 49.7125, "Agent": "DDPG"}, {"env_step": 225000, "rew": 108.11, "rew_std": 48.6119, "Agent": "DDPG"}, {"env_step": 230000, "rew": 107.9753, "rew_std": 49.3788, "Agent": "DDPG"}, {"env_step": 235000, "rew": 108.1134, "rew_std": 48.8535, "Agent": "DDPG"}, {"env_step": 240000, "rew": 108.3508, "rew_std": 49.4337, "Agent": "DDPG"}, {"env_step": 245000, "rew": 107.1296, "rew_std": 47.9657, "Agent": "DDPG"}, {"env_step": 250000, "rew": 109.8651, "rew_std": 51.256, "Agent": "DDPG"}, {"env_step": 255000, "rew": 107.0648, "rew_std": 48.2469, "Agent": "DDPG"}, {"env_step": 260000, "rew": 107.1931, "rew_std": 48.5244, "Agent": "DDPG"}, {"env_step": 265000, "rew": 108.8675, "rew_std": 50.6869, "Agent": "DDPG"}, {"env_step": 270000, "rew": 107.7211, "rew_std": 48.9009, "Agent": "DDPG"}, {"env_step": 275000, "rew": 106.8022, "rew_std": 47.7847, "Agent": "DDPG"}, {"env_step": 280000, "rew": 108.1544, "rew_std": 48.4929, "Agent": "DDPG"}, {"env_step": 285000, "rew": 107.3888, "rew_std": 48.73, "Agent": "DDPG"}, {"env_step": 290000, "rew": 108.1, "rew_std": 49.7088, "Agent": "DDPG"}, {"env_step": 295000, "rew": 107.7946, "rew_std": 48.7758, "Agent": "DDPG"}, {"env_step": 300000, "rew": 108.2477, "rew_std": 49.7653, "Agent": "DDPG"}, {"env_step": 305000, "rew": 106.3818, "rew_std": 48.0367, "Agent": "DDPG"}, {"env_step": 310000, "rew": 108.6188, "rew_std": 49.6778, "Agent": "DDPG"}, {"env_step": 315000, "rew": 108.7012, "rew_std": 49.2731, "Agent": "DDPG"}, {"env_step": 320000, "rew": 108.9132, "rew_std": 50.1521, "Agent": "DDPG"}, {"env_step": 325000, "rew": 109.3433, "rew_std": 50.3347, "Agent": "DDPG"}, {"env_step": 330000, "rew": 106.6812, "rew_std": 48.186, "Agent": "DDPG"}, {"env_step": 335000, "rew": 107.5278, "rew_std": 48.4076, "Agent": "DDPG"}, {"env_step": 340000, "rew": 109.3871, "rew_std": 50.6109, "Agent": "DDPG"}, {"env_step": 345000, "rew": 107.0201, "rew_std": 47.9292, "Agent": "DDPG"}, {"env_step": 350000, "rew": 108.046, "rew_std": 48.6814, "Agent": "DDPG"}, {"env_step": 355000, "rew": 108.6397, "rew_std": 50.246, "Agent": "DDPG"}, {"env_step": 360000, "rew": 107.8538, "rew_std": 49.0871, "Agent": "DDPG"}, {"env_step": 365000, "rew": 108.441, "rew_std": 49.4998, "Agent": "DDPG"}, {"env_step": 370000, "rew": 108.9821, "rew_std": 49.8238, "Agent": "DDPG"}, {"env_step": 375000, "rew": 107.8918, "rew_std": 49.6536, "Agent": "DDPG"}, {"env_step": 380000, "rew": 107.9529, "rew_std": 49.4383, "Agent": "DDPG"}, {"env_step": 385000, "rew": 107.6085, "rew_std": 49.2473, "Agent": "DDPG"}, {"env_step": 390000, "rew": 108.3302, "rew_std": 49.122, "Agent": "DDPG"}, {"env_step": 395000, "rew": 109.8158, "rew_std": 51.3892, "Agent": "DDPG"}, {"env_step": 400000, "rew": 107.381, "rew_std": 48.4753, "Agent": "DDPG"}, {"env_step": 405000, "rew": 108.6191, "rew_std": 49.4195, "Agent": "DDPG"}, {"env_step": 410000, "rew": 107.41, "rew_std": 48.837, "Agent": "DDPG"}, {"env_step": 415000, "rew": 108.4352, "rew_std": 49.2737, "Agent": "DDPG"}, {"env_step": 420000, "rew": 107.9026, "rew_std": 48.534, "Agent": "DDPG"}, {"env_step": 425000, "rew": 108.478, "rew_std": 48.7426, "Agent": "DDPG"}, {"env_step": 430000, "rew": 107.1057, "rew_std": 47.5283, "Agent": "DDPG"}, {"env_step": 435000, "rew": 107.6836, "rew_std": 48.4309, "Agent": "DDPG"}, {"env_step": 440000, "rew": 108.1322, "rew_std": 48.2125, "Agent": "DDPG"}, {"env_step": 445000, "rew": 107.9857, "rew_std": 49.0165, "Agent": "DDPG"}, {"env_step": 450000, "rew": 109.4034, "rew_std": 51.0131, "Agent": "DDPG"}, {"env_step": 455000, "rew": 107.6908, "rew_std": 48.9333, "Agent": "DDPG"}, {"env_step": 460000, "rew": 107.0666, "rew_std": 47.51, "Agent": "DDPG"}, {"env_step": 465000, "rew": 109.4376, "rew_std": 50.1125, "Agent": "DDPG"}, {"env_step": 470000, "rew": 108.6718, "rew_std": 49.2696, "Agent": "DDPG"}, {"env_step": 475000, "rew": 107.5808, "rew_std": 49.0431, "Agent": "DDPG"}, {"env_step": 480000, "rew": 107.2121, "rew_std": 48.7748, "Agent": "DDPG"}, {"env_step": 485000, "rew": 107.1728, "rew_std": 48.2687, "Agent": "DDPG"}, {"env_step": 490000, "rew": 108.0973, "rew_std": 49.3657, "Agent": "DDPG"}, {"env_step": 495000, "rew": 107.7327, "rew_std": 48.7304, "Agent": "DDPG"}, {"env_step": 500000, "rew": 108.8858, "rew_std": 49.8917, "Agent": "DDPG"}, {"env_step": 505000, "rew": 108.0974, "rew_std": 49.7294, "Agent": "DDPG"}, {"env_step": 510000, "rew": 107.1945, "rew_std": 47.9077, "Agent": "DDPG"}, {"env_step": 515000, "rew": 108.1582, "rew_std": 48.6089, "Agent": "DDPG"}, {"env_step": 520000, "rew": 107.6266, "rew_std": 48.4478, "Agent": "DDPG"}, {"env_step": 525000, "rew": 107.2526, "rew_std": 48.5832, "Agent": "DDPG"}, {"env_step": 530000, "rew": 107.6767, "rew_std": 48.8641, "Agent": "DDPG"}, {"env_step": 535000, "rew": 108.9989, "rew_std": 49.9125, "Agent": "DDPG"}, {"env_step": 540000, "rew": 108.1414, "rew_std": 49.2883, "Agent": "DDPG"}, {"env_step": 545000, "rew": 108.7419, "rew_std": 49.8283, "Agent": "DDPG"}, {"env_step": 550000, "rew": 107.8539, "rew_std": 48.977, "Agent": "DDPG"}, {"env_step": 555000, "rew": 108.6301, "rew_std": 49.5366, "Agent": "DDPG"}, {"env_step": 560000, "rew": 105.8462, "rew_std": 47.1965, "Agent": "DDPG"}, {"env_step": 565000, "rew": 107.7476, "rew_std": 48.4578, "Agent": "DDPG"}, {"env_step": 570000, "rew": 107.11, "rew_std": 47.5214, "Agent": "DDPG"}, {"env_step": 575000, "rew": 108.8707, "rew_std": 49.2753, "Agent": "DDPG"}, {"env_step": 580000, "rew": 108.4656, "rew_std": 49.7007, "Agent": "DDPG"}, {"env_step": 585000, "rew": 107.4115, "rew_std": 48.396, "Agent": "DDPG"}, {"env_step": 590000, "rew": 108.1877, "rew_std": 48.6477, "Agent": "DDPG"}, {"env_step": 595000, "rew": 108.6227, "rew_std": 49.4947, "Agent": "DDPG"}, {"env_step": 600000, "rew": 108.855, "rew_std": 50.5568, "Agent": "DDPG"}, {"env_step": 605000, "rew": 108.0074, "rew_std": 49.2264, "Agent": "DDPG"}, {"env_step": 610000, "rew": 106.7105, "rew_std": 47.8051, "Agent": "DDPG"}, {"env_step": 615000, "rew": 107.7101, "rew_std": 48.9149, "Agent": "DDPG"}, {"env_step": 620000, "rew": 107.2254, "rew_std": 49.1405, "Agent": "DDPG"}, {"env_step": 625000, "rew": 107.5752, "rew_std": 48.2163, "Agent": "DDPG"}, {"env_step": 630000, "rew": 108.224, "rew_std": 49.7724, "Agent": "DDPG"}, {"env_step": 635000, "rew": 108.7608, "rew_std": 50.2342, "Agent": "DDPG"}, {"env_step": 640000, "rew": 107.6411, "rew_std": 48.8166, "Agent": "DDPG"}, {"env_step": 645000, "rew": 108.7065, "rew_std": 49.4438, "Agent": "DDPG"}, {"env_step": 650000, "rew": 109.1814, "rew_std": 50.5024, "Agent": "DDPG"}, {"env_step": 655000, "rew": 109.8778, "rew_std": 50.4916, "Agent": "DDPG"}, {"env_step": 660000, "rew": 108.5942, "rew_std": 49.6353, "Agent": "DDPG"}, {"env_step": 665000, "rew": 108.0445, "rew_std": 49.3306, "Agent": "DDPG"}, {"env_step": 670000, "rew": 107.5365, "rew_std": 48.3147, "Agent": "DDPG"}, {"env_step": 675000, "rew": 107.4953, "rew_std": 47.9975, "Agent": "DDPG"}, {"env_step": 680000, "rew": 108.0237, "rew_std": 48.7486, "Agent": "DDPG"}, {"env_step": 685000, "rew": 108.4675, "rew_std": 48.824, "Agent": "DDPG"}, {"env_step": 690000, "rew": 107.6245, "rew_std": 48.3674, "Agent": "DDPG"}, {"env_step": 695000, "rew": 108.8214, "rew_std": 49.8349, "Agent": "DDPG"}, {"env_step": 700000, "rew": 107.5492, "rew_std": 48.4227, "Agent": "DDPG"}, {"env_step": 705000, "rew": 107.18, "rew_std": 48.8275, "Agent": "DDPG"}, {"env_step": 710000, "rew": 108.5283, "rew_std": 49.5153, "Agent": "DDPG"}, {"env_step": 715000, "rew": 106.5051, "rew_std": 47.4221, "Agent": "DDPG"}, {"env_step": 720000, "rew": 106.9291, "rew_std": 49.2053, "Agent": "DDPG"}, {"env_step": 725000, "rew": 108.4394, "rew_std": 49.4338, "Agent": "DDPG"}, {"env_step": 730000, "rew": 107.6665, "rew_std": 49.4634, "Agent": "DDPG"}, {"env_step": 735000, "rew": 107.7959, "rew_std": 48.591, "Agent": "DDPG"}, {"env_step": 740000, "rew": 108.0495, "rew_std": 49.8033, "Agent": "DDPG"}, {"env_step": 745000, "rew": 107.4518, "rew_std": 48.6424, "Agent": "DDPG"}, {"env_step": 750000, "rew": 108.1426, "rew_std": 49.1501, "Agent": "DDPG"}, {"env_step": 755000, "rew": 108.2628, "rew_std": 50.0382, "Agent": "DDPG"}, {"env_step": 760000, "rew": 107.2477, "rew_std": 48.0286, "Agent": "DDPG"}, {"env_step": 765000, "rew": 109.0266, "rew_std": 49.8274, "Agent": "DDPG"}, {"env_step": 770000, "rew": 109.0255, "rew_std": 49.9443, "Agent": "DDPG"}, {"env_step": 775000, "rew": 108.1221, "rew_std": 49.8079, "Agent": "DDPG"}, {"env_step": 780000, "rew": 108.4238, "rew_std": 49.3669, "Agent": "DDPG"}, {"env_step": 785000, "rew": 108.115, "rew_std": 48.8943, "Agent": "DDPG"}, {"env_step": 790000, "rew": 106.6352, "rew_std": 47.2801, "Agent": "DDPG"}, {"env_step": 795000, "rew": 108.7755, "rew_std": 49.2822, "Agent": "DDPG"}, {"env_step": 800000, "rew": 107.1741, "rew_std": 48.0624, "Agent": "DDPG"}, {"env_step": 805000, "rew": 107.5149, "rew_std": 48.7057, "Agent": "DDPG"}, {"env_step": 810000, "rew": 108.7222, "rew_std": 50.0176, "Agent": "DDPG"}, {"env_step": 815000, "rew": 107.5641, "rew_std": 48.7545, "Agent": "DDPG"}, {"env_step": 820000, "rew": 107.6578, "rew_std": 49.0399, "Agent": "DDPG"}, {"env_step": 825000, "rew": 108.2342, "rew_std": 49.4261, "Agent": "DDPG"}, {"env_step": 830000, "rew": 107.9824, "rew_std": 49.6815, "Agent": "DDPG"}, {"env_step": 835000, "rew": 108.5656, "rew_std": 49.6647, "Agent": "DDPG"}, {"env_step": 840000, "rew": 107.2489, "rew_std": 48.1444, "Agent": "DDPG"}, {"env_step": 845000, "rew": 108.5607, "rew_std": 48.6598, "Agent": "DDPG"}, {"env_step": 850000, "rew": 108.9987, "rew_std": 49.9275, "Agent": "DDPG"}, {"env_step": 855000, "rew": 108.4097, "rew_std": 49.2914, "Agent": "DDPG"}, {"env_step": 860000, "rew": 108.8319, "rew_std": 50.0234, "Agent": "DDPG"}, {"env_step": 865000, "rew": 107.2195, "rew_std": 48.4018, "Agent": "DDPG"}, {"env_step": 870000, "rew": 107.3554, "rew_std": 48.6998, "Agent": "DDPG"}, {"env_step": 875000, "rew": 108.5066, "rew_std": 49.5775, "Agent": "DDPG"}, {"env_step": 880000, "rew": 107.5358, "rew_std": 48.8969, "Agent": "DDPG"}, {"env_step": 885000, "rew": 107.4236, "rew_std": 48.9267, "Agent": "DDPG"}, {"env_step": 890000, "rew": 109.3625, "rew_std": 50.3215, "Agent": "DDPG"}, {"env_step": 895000, "rew": 107.8831, "rew_std": 48.6233, "Agent": "DDPG"}, {"env_step": 900000, "rew": 109.3476, "rew_std": 50.3894, "Agent": "DDPG"}, {"env_step": 905000, "rew": 107.8047, "rew_std": 49.2224, "Agent": "DDPG"}, {"env_step": 910000, "rew": 107.7403, "rew_std": 48.9944, "Agent": "DDPG"}, {"env_step": 915000, "rew": 107.7707, "rew_std": 48.8078, "Agent": "DDPG"}, {"env_step": 920000, "rew": 108.6377, "rew_std": 49.3496, "Agent": "DDPG"}, {"env_step": 925000, "rew": 108.3392, "rew_std": 48.886, "Agent": "DDPG"}, {"env_step": 930000, "rew": 107.7412, "rew_std": 49.0511, "Agent": "DDPG"}, {"env_step": 935000, "rew": 108.4689, "rew_std": 49.3729, "Agent": "DDPG"}, {"env_step": 940000, "rew": 108.3622, "rew_std": 48.773, "Agent": "DDPG"}, {"env_step": 945000, "rew": 108.3962, "rew_std": 49.1464, "Agent": "DDPG"}, {"env_step": 950000, "rew": 107.2917, "rew_std": 48.0124, "Agent": "DDPG"}, {"env_step": 955000, "rew": 107.329, "rew_std": 48.7632, "Agent": "DDPG"}, {"env_step": 960000, "rew": 107.8866, "rew_std": 49.1713, "Agent": "DDPG"}, {"env_step": 965000, "rew": 107.5759, "rew_std": 48.6815, "Agent": "DDPG"}, {"env_step": 970000, "rew": 108.133, "rew_std": 49.4281, "Agent": "DDPG"}, {"env_step": 975000, "rew": 107.6389, "rew_std": 48.2696, "Agent": "DDPG"}, {"env_step": 980000, "rew": 107.4483, "rew_std": 48.6085, "Agent": "DDPG"}, {"env_step": 985000, "rew": 108.0189, "rew_std": 48.8417, "Agent": "DDPG"}, {"env_step": 990000, "rew": 109.3234, "rew_std": 50.5991, "Agent": "DDPG"}, {"env_step": 995000, "rew": 109.0151, "rew_std": 50.4905, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 108.814, "rew_std": 49.8831, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 108.3801, "rew_std": 49.4534, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 108.5171, "rew_std": 49.7201, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 108.6333, "rew_std": 49.3683, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 107.8037, "rew_std": 48.8344, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 109.6875, "rew_std": 51.1063, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 107.952, "rew_std": 49.3687, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 108.3813, "rew_std": 48.8169, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 108.3889, "rew_std": 49.3835, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 108.832, "rew_std": 50.5686, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 108.2503, "rew_std": 49.4035, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 107.518, "rew_std": 48.8938, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 108.592, "rew_std": 50.0621, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 108.156, "rew_std": 48.9436, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 107.79, "rew_std": 49.1456, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 107.3237, "rew_std": 48.2445, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 108.0468, "rew_std": 49.3038, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 107.2851, "rew_std": 48.7523, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 109.5256, "rew_std": 50.6178, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 107.6415, "rew_std": 49.1169, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 108.1626, "rew_std": 49.8981, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 106.2928, "rew_std": 47.0271, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 107.5527, "rew_std": 49.2958, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 108.6973, "rew_std": 49.8643, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 108.662, "rew_std": 49.4262, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 106.7754, "rew_std": 47.1026, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 107.6413, "rew_std": 48.6138, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 108.61, "rew_std": 49.4814, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 108.4586, "rew_std": 49.4734, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 108.5004, "rew_std": 49.183, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 107.3857, "rew_std": 48.3934, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 107.8232, "rew_std": 49.21, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 107.4314, "rew_std": 48.6418, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 108.6097, "rew_std": 50.0509, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 106.9657, "rew_std": 48.2271, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 107.1207, "rew_std": 47.8233, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 108.4552, "rew_std": 48.7664, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 107.2896, "rew_std": 47.9247, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 109.0348, "rew_std": 50.3553, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 107.02, "rew_std": 47.8831, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 107.8539, "rew_std": 48.963, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 109.2758, "rew_std": 50.1332, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 108.532, "rew_std": 49.2018, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 107.9433, "rew_std": 49.1756, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 108.429, "rew_std": 50.3263, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 108.4288, "rew_std": 49.6, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 108.0104, "rew_std": 49.69, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 106.8428, "rew_std": 48.5726, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 107.897, "rew_std": 49.5459, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 107.7359, "rew_std": 48.8844, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 107.0363, "rew_std": 48.3924, "Agent": "DDPG"}, {"env_step": 0, "rew": 130.7126, "rew_std": 15.6136, "Agent": "NPG"}, {"env_step": 30720, "rew": 204.1936, "rew_std": 14.0472, "Agent": "NPG"}, {"env_step": 61440, "rew": 339.4966, "rew_std": 20.7894, "Agent": "NPG"}, {"env_step": 92160, "rew": 416.5825, "rew_std": 27.0585, "Agent": "NPG"}, {"env_step": 122880, "rew": 433.643, "rew_std": 25.155, "Agent": "NPG"}, {"env_step": 153600, "rew": 467.6656, "rew_std": 37.6244, "Agent": "NPG"}, {"env_step": 184320, "rew": 449.881, "rew_std": 26.7401, "Agent": "NPG"}, {"env_step": 215040, "rew": 500.8714, "rew_std": 32.64, "Agent": "NPG"}, {"env_step": 245760, "rew": 521.3331, "rew_std": 37.498, "Agent": "NPG"}, {"env_step": 276480, "rew": 535.6495, "rew_std": 49.0992, "Agent": "NPG"}, {"env_step": 307200, "rew": 527.3379, "rew_std": 29.7799, "Agent": "NPG"}, {"env_step": 337920, "rew": 533.5609, "rew_std": 45.2783, "Agent": "NPG"}, {"env_step": 368640, "rew": 538.9746, "rew_std": 38.9739, "Agent": "NPG"}, {"env_step": 399360, "rew": 546.3672, "rew_std": 35.0729, "Agent": "NPG"}, {"env_step": 430080, "rew": 554.849, "rew_std": 43.1286, "Agent": "NPG"}, {"env_step": 460800, "rew": 551.0495, "rew_std": 41.6599, "Agent": "NPG"}, {"env_step": 491520, "rew": 559.351, "rew_std": 38.2528, "Agent": "NPG"}, {"env_step": 522240, "rew": 590.965, "rew_std": 33.7071, "Agent": "NPG"}, {"env_step": 552960, "rew": 575.8513, "rew_std": 46.799, "Agent": "NPG"}, {"env_step": 583680, "rew": 593.3327, "rew_std": 51.5337, "Agent": "NPG"}, {"env_step": 614400, "rew": 613.6212, "rew_std": 39.0163, "Agent": "NPG"}, {"env_step": 645120, "rew": 602.1067, "rew_std": 68.7681, "Agent": "NPG"}, {"env_step": 675840, "rew": 619.7777, "rew_std": 45.8641, "Agent": "NPG"}, {"env_step": 706560, "rew": 601.1798, "rew_std": 55.9149, "Agent": "NPG"}, {"env_step": 737280, "rew": 632.423, "rew_std": 62.0028, "Agent": "NPG"}, {"env_step": 768000, "rew": 614.2294, "rew_std": 52.2342, "Agent": "NPG"}, {"env_step": 798720, "rew": 646.6038, "rew_std": 52.8697, "Agent": "NPG"}, {"env_step": 829440, "rew": 674.5708, "rew_std": 67.6018, "Agent": "NPG"}, {"env_step": 860160, "rew": 652.7017, "rew_std": 58.1917, "Agent": "NPG"}, {"env_step": 890880, "rew": 678.0284, "rew_std": 66.6736, "Agent": "NPG"}, {"env_step": 921600, "rew": 704.4138, "rew_std": 63.1514, "Agent": "NPG"}, {"env_step": 952320, "rew": 715.6711, "rew_std": 78.4424, "Agent": "NPG"}, {"env_step": 983040, "rew": 753.2429, "rew_std": 104.9714, "Agent": "NPG"}, {"env_step": 1013760, "rew": 774.7323, "rew_std": 80.2417, "Agent": "NPG"}, {"env_step": 1044480, "rew": 782.5322, "rew_std": 137.5952, "Agent": "NPG"}, {"env_step": 1075200, "rew": 845.1488, "rew_std": 135.6502, "Agent": "NPG"}, {"env_step": 1105920, "rew": 918.8586, "rew_std": 209.3586, "Agent": "NPG"}, {"env_step": 1136640, "rew": 856.446, "rew_std": 118.0626, "Agent": "NPG"}, {"env_step": 1167360, "rew": 1025.0273, "rew_std": 242.0878, "Agent": "NPG"}, {"env_step": 1198080, "rew": 1007.6808, "rew_std": 261.4351, "Agent": "NPG"}, {"env_step": 1228800, "rew": 992.563, "rew_std": 190.4303, "Agent": "NPG"}, {"env_step": 1259520, "rew": 1057.9305, "rew_std": 268.7743, "Agent": "NPG"}, {"env_step": 1290240, "rew": 1202.8359, "rew_std": 429.4217, "Agent": "NPG"}, {"env_step": 1320960, "rew": 1235.7178, "rew_std": 375.5561, "Agent": "NPG"}, {"env_step": 1351680, "rew": 1343.8614, "rew_std": 572.9457, "Agent": "NPG"}, {"env_step": 1382400, "rew": 1343.9765, "rew_std": 539.2107, "Agent": "NPG"}, {"env_step": 1413120, "rew": 1413.9654, "rew_std": 623.4225, "Agent": "NPG"}, {"env_step": 1443840, "rew": 1427.2317, "rew_std": 623.5584, "Agent": "NPG"}, {"env_step": 1474560, "rew": 1595.0829, "rew_std": 695.3703, "Agent": "NPG"}, {"env_step": 1505280, "rew": 1733.6694, "rew_std": 763.9628, "Agent": "NPG"}, {"env_step": 1536000, "rew": 1459.7915, "rew_std": 627.7681, "Agent": "NPG"}, {"env_step": 1566720, "rew": 1836.4496, "rew_std": 733.3426, "Agent": "NPG"}, {"env_step": 1597440, "rew": 1799.7874, "rew_std": 879.0576, "Agent": "NPG"}, {"env_step": 1628160, "rew": 1915.8978, "rew_std": 903.326, "Agent": "NPG"}, {"env_step": 1658880, "rew": 1919.824, "rew_std": 973.4952, "Agent": "NPG"}, {"env_step": 1689600, "rew": 2222.8247, "rew_std": 1029.183, "Agent": "NPG"}, {"env_step": 1720320, "rew": 2123.0353, "rew_std": 914.354, "Agent": "NPG"}, {"env_step": 1751040, "rew": 2498.902, "rew_std": 1173.5658, "Agent": "NPG"}, {"env_step": 1781760, "rew": 2213.2595, "rew_std": 1051.8403, "Agent": "NPG"}, {"env_step": 1812480, "rew": 2475.1808, "rew_std": 1287.9709, "Agent": "NPG"}, {"env_step": 1843200, "rew": 2493.576, "rew_std": 1142.2587, "Agent": "NPG"}, {"env_step": 1873920, "rew": 2636.7974, "rew_std": 1170.2697, "Agent": "NPG"}, {"env_step": 1904640, "rew": 2679.8487, "rew_std": 1226.0742, "Agent": "NPG"}, {"env_step": 1935360, "rew": 2871.4496, "rew_std": 1250.855, "Agent": "NPG"}, {"env_step": 1966080, "rew": 2907.0378, "rew_std": 1281.2157, "Agent": "NPG"}, {"env_step": 1996800, "rew": 2988.5603, "rew_std": 1249.4198, "Agent": "NPG"}, {"env_step": 2027520, "rew": 3035.098, "rew_std": 1297.1558, "Agent": "NPG"}, {"env_step": 2058240, "rew": 3039.6056, "rew_std": 1284.4424, "Agent": "NPG"}, {"env_step": 2088960, "rew": 3212.0628, "rew_std": 1389.7895, "Agent": "NPG"}, {"env_step": 2119680, "rew": 3207.0746, "rew_std": 1329.2494, "Agent": "NPG"}, {"env_step": 2150400, "rew": 3301.2632, "rew_std": 1370.4126, "Agent": "NPG"}, {"env_step": 2181120, "rew": 3129.8601, "rew_std": 1423.0596, "Agent": "NPG"}, {"env_step": 2211840, "rew": 3261.4915, "rew_std": 1259.3788, "Agent": "NPG"}, {"env_step": 2242560, "rew": 2997.1561, "rew_std": 1433.1875, "Agent": "NPG"}, {"env_step": 2273280, "rew": 3364.489, "rew_std": 1353.9179, "Agent": "NPG"}, {"env_step": 2304000, "rew": 3313.5639, "rew_std": 1349.3013, "Agent": "NPG"}, {"env_step": 2334720, "rew": 3331.1348, "rew_std": 1414.5356, "Agent": "NPG"}, {"env_step": 2365440, "rew": 3366.3683, "rew_std": 1323.4285, "Agent": "NPG"}, {"env_step": 2396160, "rew": 3416.0622, "rew_std": 1159.1634, "Agent": "NPG"}, {"env_step": 2426880, "rew": 3447.5684, "rew_std": 1291.6741, "Agent": "NPG"}, {"env_step": 2457600, "rew": 3600.2265, "rew_std": 1172.9558, "Agent": "NPG"}, {"env_step": 2488320, "rew": 3755.61, "rew_std": 1232.5684, "Agent": "NPG"}, {"env_step": 2519040, "rew": 3937.5575, "rew_std": 1295.6958, "Agent": "NPG"}, {"env_step": 2549760, "rew": 3891.9033, "rew_std": 1119.5628, "Agent": "NPG"}, {"env_step": 2580480, "rew": 3458.7579, "rew_std": 1190.5515, "Agent": "NPG"}, {"env_step": 2611200, "rew": 3646.6966, "rew_std": 1311.4086, "Agent": "NPG"}, {"env_step": 2641920, "rew": 4082.6632, "rew_std": 1185.2542, "Agent": "NPG"}, {"env_step": 2672640, "rew": 3949.022, "rew_std": 1181.682, "Agent": "NPG"}, {"env_step": 2703360, "rew": 4034.4369, "rew_std": 1132.6729, "Agent": "NPG"}, {"env_step": 2734080, "rew": 3888.856, "rew_std": 1139.0166, "Agent": "NPG"}, {"env_step": 2764800, "rew": 3989.4274, "rew_std": 1167.2599, "Agent": "NPG"}, {"env_step": 2795520, "rew": 4028.2068, "rew_std": 1237.5093, "Agent": "NPG"}, {"env_step": 2826240, "rew": 4180.1562, "rew_std": 1282.7108, "Agent": "NPG"}, {"env_step": 2856960, "rew": 4337.1518, "rew_std": 1411.7956, "Agent": "NPG"}, {"env_step": 2887680, "rew": 4391.8549, "rew_std": 1245.5101, "Agent": "NPG"}, {"env_step": 2918400, "rew": 4288.3707, "rew_std": 1264.8927, "Agent": "NPG"}, {"env_step": 2949120, "rew": 4228.1116, "rew_std": 1184.0171, "Agent": "NPG"}, {"env_step": 2979840, "rew": 4031.2134, "rew_std": 1245.2265, "Agent": "NPG"}, {"env_step": 3010560, "rew": 4172.5567, "rew_std": 1301.0824, "Agent": "NPG"}, {"env_step": 3041280, "rew": 4342.0228, "rew_std": 1215.7579, "Agent": "NPG"}, {"env_step": 3072000, "rew": 4225.0898, "rew_std": 1276.1164, "Agent": "NPG"}]