[{"env_step": 0, "rew": 2.854, "rew_std": 2.439, "Agent": "PPO"}, {"env_step": 30720, "rew": 261.6371, "rew_std": 31.9544, "Agent": "PPO"}, {"env_step": 61440, "rew": 337.5775, "rew_std": 33.1557, "Agent": "PPO"}, {"env_step": 92160, "rew": 362.9134, "rew_std": 58.8816, "Agent": "PPO"}, {"env_step": 122880, "rew": 425.8273, "rew_std": 60.5094, "Agent": "PPO"}, {"env_step": 153600, "rew": 553.2555, "rew_std": 116.4205, "Agent": "PPO"}, {"env_step": 184320, "rew": 715.2234, "rew_std": 271.9853, "Agent": "PPO"}, {"env_step": 215040, "rew": 905.6901, "rew_std": 427.5947, "Agent": "PPO"}, {"env_step": 245760, "rew": 1126.158, "rew_std": 465.6568, "Agent": "PPO"}, {"env_step": 276480, "rew": 1337.0027, "rew_std": 444.4031, "Agent": "PPO"}, {"env_step": 307200, "rew": 1985.784, "rew_std": 756.4732, "Agent": "PPO"}, {"env_step": 337920, "rew": 1939.7872, "rew_std": 639.0395, "Agent": "PPO"}, {"env_step": 368640, "rew": 2077.5675, "rew_std": 774.0649, "Agent": "PPO"}, {"env_step": 399360, "rew": 2344.1341, "rew_std": 944.0267, "Agent": "PPO"}, {"env_step": 430080, "rew": 2608.1656, "rew_std": 686.5428, "Agent": "PPO"}, {"env_step": 460800, "rew": 2552.6508, "rew_std": 774.8729, "Agent": "PPO"}, {"env_step": 491520, "rew": 2759.0287, "rew_std": 613.4486, "Agent": "PPO"}, {"env_step": 522240, "rew": 2954.2882, "rew_std": 641.8847, "Agent": "PPO"}, {"env_step": 552960, "rew": 2740.7866, "rew_std": 597.9693, "Agent": "PPO"}, {"env_step": 583680, "rew": 2758.2169, "rew_std": 493.9706, "Agent": "PPO"}, {"env_step": 614400, "rew": 3133.3863, "rew_std": 838.3549, "Agent": "PPO"}, {"env_step": 645120, "rew": 3025.815, "rew_std": 441.8207, "Agent": "PPO"}, {"env_step": 675840, "rew": 3230.7174, "rew_std": 628.2298, "Agent": "PPO"}, {"env_step": 706560, "rew": 3501.1757, "rew_std": 661.1069, "Agent": "PPO"}, {"env_step": 737280, "rew": 3306.1529, "rew_std": 632.7268, "Agent": "PPO"}, {"env_step": 768000, "rew": 3202.6631, "rew_std": 575.353, "Agent": "PPO"}, {"env_step": 798720, "rew": 3125.1025, "rew_std": 641.088, "Agent": "PPO"}, {"env_step": 829440, "rew": 2937.7286, "rew_std": 972.9868, "Agent": "PPO"}, {"env_step": 860160, "rew": 3507.4568, "rew_std": 1043.6589, "Agent": "PPO"}, {"env_step": 890880, "rew": 3588.5181, "rew_std": 756.6306, "Agent": "PPO"}, {"env_step": 921600, "rew": 3286.1651, "rew_std": 1041.8169, "Agent": "PPO"}, {"env_step": 952320, "rew": 3515.5619, "rew_std": 1043.1778, "Agent": "PPO"}, {"env_step": 983040, "rew": 3493.7872, "rew_std": 1024.8728, "Agent": "PPO"}, {"env_step": 1013760, "rew": 3410.2609, "rew_std": 685.6092, "Agent": "PPO"}, {"env_step": 1044480, "rew": 3390.317, "rew_std": 795.0583, "Agent": "PPO"}, {"env_step": 1075200, "rew": 3297.4848, "rew_std": 847.0978, "Agent": "PPO"}, {"env_step": 1105920, "rew": 3789.9667, "rew_std": 896.1263, "Agent": "PPO"}, {"env_step": 1136640, "rew": 3485.3889, "rew_std": 775.1673, "Agent": "PPO"}, {"env_step": 1167360, "rew": 3766.0153, "rew_std": 762.1712, "Agent": "PPO"}, {"env_step": 1198080, "rew": 3916.4919, "rew_std": 637.0181, "Agent": "PPO"}, {"env_step": 1228800, "rew": 3641.0305, "rew_std": 734.5641, "Agent": "PPO"}, {"env_step": 1259520, "rew": 3838.3772, "rew_std": 871.0735, "Agent": "PPO"}, {"env_step": 1290240, "rew": 4149.6348, "rew_std": 822.515, "Agent": "PPO"}, {"env_step": 1320960, "rew": 3820.7451, "rew_std": 824.6649, "Agent": "PPO"}, {"env_step": 1351680, "rew": 3523.6159, "rew_std": 802.2996, "Agent": "PPO"}, {"env_step": 1382400, "rew": 3594.5379, "rew_std": 649.5449, "Agent": "PPO"}, {"env_step": 1413120, "rew": 4009.9213, "rew_std": 861.1393, "Agent": "PPO"}, {"env_step": 1443840, "rew": 3700.4344, "rew_std": 932.635, "Agent": "PPO"}, {"env_step": 1474560, "rew": 3810.8253, "rew_std": 948.657, "Agent": "PPO"}, {"env_step": 1505280, "rew": 3932.9272, "rew_std": 767.4963, "Agent": "PPO"}, {"env_step": 1536000, "rew": 3571.2177, "rew_std": 882.525, "Agent": "PPO"}, {"env_step": 1566720, "rew": 3637.1949, "rew_std": 878.2077, "Agent": "PPO"}, {"env_step": 1597440, "rew": 4002.2786, "rew_std": 669.5074, "Agent": "PPO"}, {"env_step": 1628160, "rew": 3986.5518, "rew_std": 651.4945, "Agent": "PPO"}, {"env_step": 1658880, "rew": 4073.0553, "rew_std": 530.0421, "Agent": "PPO"}, {"env_step": 1689600, "rew": 4123.7576, "rew_std": 836.6608, "Agent": "PPO"}, {"env_step": 1720320, "rew": 4093.6101, "rew_std": 889.4021, "Agent": "PPO"}, {"env_step": 1751040, "rew": 4012.082, "rew_std": 834.2345, "Agent": "PPO"}, {"env_step": 1781760, "rew": 4008.7549, "rew_std": 1018.6348, "Agent": "PPO"}, {"env_step": 1812480, "rew": 4002.3804, "rew_std": 935.0496, "Agent": "PPO"}, {"env_step": 1843200, "rew": 4109.2768, "rew_std": 884.4799, "Agent": "PPO"}, {"env_step": 1873920, "rew": 3893.1839, "rew_std": 1441.2806, "Agent": "PPO"}, {"env_step": 1904640, "rew": 3784.3364, "rew_std": 949.5072, "Agent": "PPO"}, {"env_step": 1935360, "rew": 4191.4698, "rew_std": 1208.749, "Agent": "PPO"}, {"env_step": 1966080, "rew": 4018.6931, "rew_std": 904.0015, "Agent": "PPO"}, {"env_step": 1996800, "rew": 4018.0772, "rew_std": 1023.582, "Agent": "PPO"}, {"env_step": 2027520, "rew": 3936.778, "rew_std": 706.0211, "Agent": "PPO"}, {"env_step": 2058240, "rew": 4521.6965, "rew_std": 844.448, "Agent": "PPO"}, {"env_step": 2088960, "rew": 4279.1014, "rew_std": 763.1104, "Agent": "PPO"}, {"env_step": 2119680, "rew": 3928.6194, "rew_std": 801.9427, "Agent": "PPO"}, {"env_step": 2150400, "rew": 4478.9202, "rew_std": 910.9486, "Agent": "PPO"}, {"env_step": 2181120, "rew": 4536.146, "rew_std": 754.0238, "Agent": "PPO"}, {"env_step": 2211840, "rew": 3723.36, "rew_std": 1065.5419, "Agent": "PPO"}, {"env_step": 2242560, "rew": 4600.0676, "rew_std": 843.5307, "Agent": "PPO"}, {"env_step": 2273280, "rew": 4646.8615, "rew_std": 693.3327, "Agent": "PPO"}, {"env_step": 2304000, "rew": 4895.5572, "rew_std": 704.2969, "Agent": "PPO"}, {"env_step": 2334720, "rew": 4682.4576, "rew_std": 771.115, "Agent": "PPO"}, {"env_step": 2365440, "rew": 3961.3622, "rew_std": 757.2372, "Agent": "PPO"}, {"env_step": 2396160, "rew": 4342.5382, "rew_std": 756.5942, "Agent": "PPO"}, {"env_step": 2426880, "rew": 4406.6723, "rew_std": 752.6507, "Agent": "PPO"}, {"env_step": 2457600, "rew": 4461.0387, "rew_std": 660.9203, "Agent": "PPO"}, {"env_step": 2488320, "rew": 4450.4049, "rew_std": 1070.5688, "Agent": "PPO"}, {"env_step": 2519040, "rew": 4628.4549, "rew_std": 883.0679, "Agent": "PPO"}, {"env_step": 2549760, "rew": 4353.2668, "rew_std": 1022.8285, "Agent": "PPO"}, {"env_step": 2580480, "rew": 4431.4896, "rew_std": 1042.5742, "Agent": "PPO"}, {"env_step": 2611200, "rew": 4444.7746, "rew_std": 978.6624, "Agent": "PPO"}, {"env_step": 2641920, "rew": 4753.0368, "rew_std": 904.3219, "Agent": "PPO"}, {"env_step": 2672640, "rew": 4475.2381, "rew_std": 716.1777, "Agent": "PPO"}, {"env_step": 2703360, "rew": 4213.8239, "rew_std": 919.9318, "Agent": "PPO"}, {"env_step": 2734080, "rew": 4766.5872, "rew_std": 942.6024, "Agent": "PPO"}, {"env_step": 2764800, "rew": 4714.3712, "rew_std": 988.3013, "Agent": "PPO"}, {"env_step": 2795520, "rew": 4654.9762, "rew_std": 985.8355, "Agent": "PPO"}, {"env_step": 2826240, "rew": 4544.4566, "rew_std": 994.8492, "Agent": "PPO"}, {"env_step": 2856960, "rew": 4454.7327, "rew_std": 971.1529, "Agent": "PPO"}, {"env_step": 2887680, "rew": 4622.6955, "rew_std": 1030.6566, "Agent": "PPO"}, {"env_step": 2918400, "rew": 4118.5372, "rew_std": 1002.9298, "Agent": "PPO"}, {"env_step": 2949120, "rew": 4404.5734, "rew_std": 797.9952, "Agent": "PPO"}, {"env_step": 2979840, "rew": 4564.1186, "rew_std": 614.9968, "Agent": "PPO"}, {"env_step": 3010560, "rew": 4674.4358, "rew_std": 688.045, "Agent": "PPO"}, {"env_step": 3041280, "rew": 4624.0476, "rew_std": 689.6915, "Agent": "PPO"}, {"env_step": 3072000, "rew": 4369.7249, "rew_std": 694.8409, "Agent": "PPO"}, {"env_step": 0, "rew": 6.442, "rew_std": 12.7772, "Agent": "TD3"}, {"env_step": 5000, "rew": 158.7514, "rew_std": 149.0815, "Agent": "TD3"}, {"env_step": 10000, "rew": 328.0599, "rew_std": 149.4269, "Agent": "TD3"}, {"env_step": 15000, "rew": 233.9062, "rew_std": 69.258, "Agent": "TD3"}, {"env_step": 20000, "rew": 201.0709, "rew_std": 80.6006, "Agent": "TD3"}, {"env_step": 25000, "rew": 225.3551, "rew_std": 94.806, "Agent": "TD3"}, {"env_step": 30000, "rew": 239.5848, "rew_std": 96.0552, "Agent": "TD3"}, {"env_step": 35000, "rew": 269.1682, "rew_std": 32.1917, "Agent": "TD3"}, {"env_step": 40000, "rew": 320.811, "rew_std": 73.1787, "Agent": "TD3"}, {"env_step": 45000, "rew": 343.9271, "rew_std": 128.5434, "Agent": "TD3"}, {"env_step": 50000, "rew": 302.3467, "rew_std": 90.5274, "Agent": "TD3"}, {"env_step": 55000, "rew": 312.8566, "rew_std": 84.0656, "Agent": "TD3"}, {"env_step": 60000, "rew": 352.6576, "rew_std": 106.7761, "Agent": "TD3"}, {"env_step": 65000, "rew": 326.7521, "rew_std": 94.8082, "Agent": "TD3"}, {"env_step": 70000, "rew": 330.8671, "rew_std": 83.0347, "Agent": "TD3"}, {"env_step": 75000, "rew": 372.7445, "rew_std": 84.5384, "Agent": "TD3"}, {"env_step": 80000, "rew": 375.3707, "rew_std": 115.8116, "Agent": "TD3"}, {"env_step": 85000, "rew": 400.8054, "rew_std": 161.2748, "Agent": "TD3"}, {"env_step": 90000, "rew": 388.8271, "rew_std": 102.1788, "Agent": "TD3"}, {"env_step": 95000, "rew": 372.0491, "rew_std": 93.8757, "Agent": "TD3"}, {"env_step": 100000, "rew": 483.179, "rew_std": 173.8667, "Agent": "TD3"}, {"env_step": 105000, "rew": 433.9904, "rew_std": 230.4379, "Agent": "TD3"}, {"env_step": 110000, "rew": 399.904, "rew_std": 146.0952, "Agent": "TD3"}, {"env_step": 115000, "rew": 429.8596, "rew_std": 186.4218, "Agent": "TD3"}, {"env_step": 120000, "rew": 516.3706, "rew_std": 239.1313, "Agent": "TD3"}, {"env_step": 125000, "rew": 442.9991, "rew_std": 141.8523, "Agent": "TD3"}, {"env_step": 130000, "rew": 557.6177, "rew_std": 265.7382, "Agent": "TD3"}, {"env_step": 135000, "rew": 469.2168, "rew_std": 133.5503, "Agent": "TD3"}, {"env_step": 140000, "rew": 524.6685, "rew_std": 422.1725, "Agent": "TD3"}, {"env_step": 145000, "rew": 684.2732, "rew_std": 423.544, "Agent": "TD3"}, {"env_step": 150000, "rew": 734.8403, "rew_std": 482.4015, "Agent": "TD3"}, {"env_step": 155000, "rew": 683.5625, "rew_std": 305.5673, "Agent": "TD3"}, {"env_step": 160000, "rew": 611.7085, "rew_std": 144.0629, "Agent": "TD3"}, {"env_step": 165000, "rew": 706.4468, "rew_std": 359.9577, "Agent": "TD3"}, {"env_step": 170000, "rew": 601.0122, "rew_std": 169.809, "Agent": "TD3"}, {"env_step": 175000, "rew": 661.1723, "rew_std": 281.8214, "Agent": "TD3"}, {"env_step": 180000, "rew": 705.3777, "rew_std": 239.7503, "Agent": "TD3"}, {"env_step": 185000, "rew": 794.0521, "rew_std": 374.1933, "Agent": "TD3"}, {"env_step": 190000, "rew": 823.9824, "rew_std": 398.4226, "Agent": "TD3"}, {"env_step": 195000, "rew": 699.2463, "rew_std": 208.1976, "Agent": "TD3"}, {"env_step": 200000, "rew": 941.3463, "rew_std": 364.9526, "Agent": "TD3"}, {"env_step": 205000, "rew": 1112.0146, "rew_std": 558.3674, "Agent": "TD3"}, {"env_step": 210000, "rew": 841.7313, "rew_std": 344.6793, "Agent": "TD3"}, {"env_step": 215000, "rew": 855.5637, "rew_std": 342.3671, "Agent": "TD3"}, {"env_step": 220000, "rew": 1082.3426, "rew_std": 419.8525, "Agent": "TD3"}, {"env_step": 225000, "rew": 996.6779, "rew_std": 302.9571, "Agent": "TD3"}, {"env_step": 230000, "rew": 1110.0677, "rew_std": 637.767, "Agent": "TD3"}, {"env_step": 235000, "rew": 986.4518, "rew_std": 486.7762, "Agent": "TD3"}, {"env_step": 240000, "rew": 1052.8166, "rew_std": 331.3324, "Agent": "TD3"}, {"env_step": 245000, "rew": 976.0542, "rew_std": 311.9513, "Agent": "TD3"}, {"env_step": 250000, "rew": 1073.1536, "rew_std": 401.591, "Agent": "TD3"}, {"env_step": 255000, "rew": 1027.4662, "rew_std": 452.8689, "Agent": "TD3"}, {"env_step": 260000, "rew": 1255.6355, "rew_std": 366.8668, "Agent": "TD3"}, {"env_step": 265000, "rew": 1134.7905, "rew_std": 633.5713, "Agent": "TD3"}, {"env_step": 270000, "rew": 1350.4891, "rew_std": 514.0592, "Agent": "TD3"}, {"env_step": 275000, "rew": 1528.3098, "rew_std": 639.93, "Agent": "TD3"}, {"env_step": 280000, "rew": 1561.4072, "rew_std": 624.7374, "Agent": "TD3"}, {"env_step": 285000, "rew": 1394.1363, "rew_std": 755.478, "Agent": "TD3"}, {"env_step": 290000, "rew": 1487.8592, "rew_std": 619.5499, "Agent": "TD3"}, {"env_step": 295000, "rew": 1613.1424, "rew_std": 429.2336, "Agent": "TD3"}, {"env_step": 300000, "rew": 1663.4857, "rew_std": 444.9467, "Agent": "TD3"}, {"env_step": 305000, "rew": 1694.6474, "rew_std": 574.26, "Agent": "TD3"}, {"env_step": 310000, "rew": 1761.2344, "rew_std": 737.9531, "Agent": "TD3"}, {"env_step": 315000, "rew": 1737.3753, "rew_std": 690.1306, "Agent": "TD3"}, {"env_step": 320000, "rew": 1484.3802, "rew_std": 683.9933, "Agent": "TD3"}, {"env_step": 325000, "rew": 1595.0691, "rew_std": 803.0037, "Agent": "TD3"}, {"env_step": 330000, "rew": 2032.7374, "rew_std": 690.3116, "Agent": "TD3"}, {"env_step": 335000, "rew": 1934.8132, "rew_std": 666.4994, "Agent": "TD3"}, {"env_step": 340000, "rew": 1780.9275, "rew_std": 848.6981, "Agent": "TD3"}, {"env_step": 345000, "rew": 1737.634, "rew_std": 610.4062, "Agent": "TD3"}, {"env_step": 350000, "rew": 1773.278, "rew_std": 800.7065, "Agent": "TD3"}, {"env_step": 355000, "rew": 1812.198, "rew_std": 839.2482, "Agent": "TD3"}, {"env_step": 360000, "rew": 1711.6147, "rew_std": 753.6186, "Agent": "TD3"}, {"env_step": 365000, "rew": 2240.8956, "rew_std": 880.8569, "Agent": "TD3"}, {"env_step": 370000, "rew": 2087.6909, "rew_std": 902.8196, "Agent": "TD3"}, {"env_step": 375000, "rew": 2304.4965, "rew_std": 833.5611, "Agent": "TD3"}, {"env_step": 380000, "rew": 2100.6447, "rew_std": 957.1324, "Agent": "TD3"}, {"env_step": 385000, "rew": 2058.1073, "rew_std": 862.5639, "Agent": "TD3"}, {"env_step": 390000, "rew": 2363.7057, "rew_std": 771.2759, "Agent": "TD3"}, {"env_step": 395000, "rew": 2455.8049, "rew_std": 658.723, "Agent": "TD3"}, {"env_step": 400000, "rew": 2348.6439, "rew_std": 633.6437, "Agent": "TD3"}, {"env_step": 405000, "rew": 2273.554, "rew_std": 667.0168, "Agent": "TD3"}, {"env_step": 410000, "rew": 2291.7861, "rew_std": 770.9224, "Agent": "TD3"}, {"env_step": 415000, "rew": 2513.2399, "rew_std": 848.8201, "Agent": "TD3"}, {"env_step": 420000, "rew": 2208.2059, "rew_std": 696.3375, "Agent": "TD3"}, {"env_step": 425000, "rew": 2166.119, "rew_std": 715.4351, "Agent": "TD3"}, {"env_step": 430000, "rew": 2224.1711, "rew_std": 731.2473, "Agent": "TD3"}, {"env_step": 435000, "rew": 1897.0515, "rew_std": 880.6732, "Agent": "TD3"}, {"env_step": 440000, "rew": 2551.5153, "rew_std": 701.0192, "Agent": "TD3"}, {"env_step": 445000, "rew": 2334.9395, "rew_std": 703.5641, "Agent": "TD3"}, {"env_step": 450000, "rew": 2505.681, "rew_std": 686.3249, "Agent": "TD3"}, {"env_step": 455000, "rew": 2355.8402, "rew_std": 890.6842, "Agent": "TD3"}, {"env_step": 460000, "rew": 2293.5938, "rew_std": 838.344, "Agent": "TD3"}, {"env_step": 465000, "rew": 2368.7359, "rew_std": 830.1159, "Agent": "TD3"}, {"env_step": 470000, "rew": 2411.0592, "rew_std": 704.3093, "Agent": "TD3"}, {"env_step": 475000, "rew": 2751.6453, "rew_std": 705.4476, "Agent": "TD3"}, {"env_step": 480000, "rew": 2580.7633, "rew_std": 779.1095, "Agent": "TD3"}, {"env_step": 485000, "rew": 2978.5183, "rew_std": 727.8662, "Agent": "TD3"}, {"env_step": 490000, "rew": 2824.3097, "rew_std": 749.4953, "Agent": "TD3"}, {"env_step": 495000, "rew": 2485.2124, "rew_std": 769.164, "Agent": "TD3"}, {"env_step": 500000, "rew": 2854.0884, "rew_std": 661.4938, "Agent": "TD3"}, {"env_step": 505000, "rew": 2143.0347, "rew_std": 963.777, "Agent": "TD3"}, {"env_step": 510000, "rew": 3001.1841, "rew_std": 742.2609, "Agent": "TD3"}, {"env_step": 515000, "rew": 2736.8395, "rew_std": 781.8594, "Agent": "TD3"}, {"env_step": 520000, "rew": 2945.8561, "rew_std": 707.811, "Agent": "TD3"}, {"env_step": 525000, "rew": 2805.6244, "rew_std": 579.5327, "Agent": "TD3"}, {"env_step": 530000, "rew": 2796.7993, "rew_std": 681.2886, "Agent": "TD3"}, {"env_step": 535000, "rew": 2951.7061, "rew_std": 682.8467, "Agent": "TD3"}, {"env_step": 540000, "rew": 2958.4438, "rew_std": 684.3542, "Agent": "TD3"}, {"env_step": 545000, "rew": 2872.1978, "rew_std": 734.9229, "Agent": "TD3"}, {"env_step": 550000, "rew": 3019.7389, "rew_std": 756.6407, "Agent": "TD3"}, {"env_step": 555000, "rew": 3024.8354, "rew_std": 588.9253, "Agent": "TD3"}, {"env_step": 560000, "rew": 3044.8315, "rew_std": 669.2755, "Agent": "TD3"}, {"env_step": 565000, "rew": 3151.5658, "rew_std": 725.1738, "Agent": "TD3"}, {"env_step": 570000, "rew": 2815.677, "rew_std": 768.4374, "Agent": "TD3"}, {"env_step": 575000, "rew": 2930.3515, "rew_std": 882.4038, "Agent": "TD3"}, {"env_step": 580000, "rew": 3024.0144, "rew_std": 762.7719, "Agent": "TD3"}, {"env_step": 585000, "rew": 2818.3069, "rew_std": 702.1715, "Agent": "TD3"}, {"env_step": 590000, "rew": 3214.1448, "rew_std": 524.9864, "Agent": "TD3"}, {"env_step": 595000, "rew": 3194.9089, "rew_std": 602.4906, "Agent": "TD3"}, {"env_step": 600000, "rew": 3249.3552, "rew_std": 561.4048, "Agent": "TD3"}, {"env_step": 605000, "rew": 3195.2999, "rew_std": 553.2233, "Agent": "TD3"}, {"env_step": 610000, "rew": 3223.7284, "rew_std": 745.6228, "Agent": "TD3"}, {"env_step": 615000, "rew": 3494.4464, "rew_std": 460.7696, "Agent": "TD3"}, {"env_step": 620000, "rew": 3250.9882, "rew_std": 632.032, "Agent": "TD3"}, {"env_step": 625000, "rew": 3252.4065, "rew_std": 362.011, "Agent": "TD3"}, {"env_step": 630000, "rew": 3348.9026, "rew_std": 541.9568, "Agent": "TD3"}, {"env_step": 635000, "rew": 3341.5474, "rew_std": 520.4724, "Agent": "TD3"}, {"env_step": 640000, "rew": 3465.9107, "rew_std": 470.1472, "Agent": "TD3"}, {"env_step": 645000, "rew": 3447.5678, "rew_std": 339.6862, "Agent": "TD3"}, {"env_step": 650000, "rew": 3526.4283, "rew_std": 392.9445, "Agent": "TD3"}, {"env_step": 655000, "rew": 3497.1426, "rew_std": 299.4359, "Agent": "TD3"}, {"env_step": 660000, "rew": 3560.9044, "rew_std": 274.2762, "Agent": "TD3"}, {"env_step": 665000, "rew": 3481.2923, "rew_std": 508.8687, "Agent": "TD3"}, {"env_step": 670000, "rew": 3450.3515, "rew_std": 474.4117, "Agent": "TD3"}, {"env_step": 675000, "rew": 3620.2938, "rew_std": 262.9504, "Agent": "TD3"}, {"env_step": 680000, "rew": 3605.5657, "rew_std": 327.8125, "Agent": "TD3"}, {"env_step": 685000, "rew": 3693.7608, "rew_std": 285.3848, "Agent": "TD3"}, {"env_step": 690000, "rew": 3646.776, "rew_std": 251.3765, "Agent": "TD3"}, {"env_step": 695000, "rew": 3634.8418, "rew_std": 401.0298, "Agent": "TD3"}, {"env_step": 700000, "rew": 3493.2776, "rew_std": 498.0473, "Agent": "TD3"}, {"env_step": 705000, "rew": 3558.622, "rew_std": 311.7681, "Agent": "TD3"}, {"env_step": 710000, "rew": 3671.6434, "rew_std": 353.3217, "Agent": "TD3"}, {"env_step": 715000, "rew": 3455.5073, "rew_std": 537.4161, "Agent": "TD3"}, {"env_step": 720000, "rew": 3652.0814, "rew_std": 369.6568, "Agent": "TD3"}, {"env_step": 725000, "rew": 3601.9809, "rew_std": 502.9231, "Agent": "TD3"}, {"env_step": 730000, "rew": 3667.8053, "rew_std": 364.6437, "Agent": "TD3"}, {"env_step": 735000, "rew": 3734.6185, "rew_std": 379.8678, "Agent": "TD3"}, {"env_step": 740000, "rew": 3624.3996, "rew_std": 406.5599, "Agent": "TD3"}, {"env_step": 745000, "rew": 3550.2741, "rew_std": 567.7901, "Agent": "TD3"}, {"env_step": 750000, "rew": 3617.8669, "rew_std": 448.0757, "Agent": "TD3"}, {"env_step": 755000, "rew": 3741.3288, "rew_std": 326.8557, "Agent": "TD3"}, {"env_step": 760000, "rew": 3730.5887, "rew_std": 325.761, "Agent": "TD3"}, {"env_step": 765000, "rew": 3729.6041, "rew_std": 362.6786, "Agent": "TD3"}, {"env_step": 770000, "rew": 3711.055, "rew_std": 378.0649, "Agent": "TD3"}, {"env_step": 775000, "rew": 3671.1828, "rew_std": 503.9591, "Agent": "TD3"}, {"env_step": 780000, "rew": 3588.0924, "rew_std": 560.2544, "Agent": "TD3"}, {"env_step": 785000, "rew": 3698.8766, "rew_std": 416.8417, "Agent": "TD3"}, {"env_step": 790000, "rew": 3750.5026, "rew_std": 394.3008, "Agent": "TD3"}, {"env_step": 795000, "rew": 3787.7582, "rew_std": 340.0923, "Agent": "TD3"}, {"env_step": 800000, "rew": 3740.6554, "rew_std": 441.4694, "Agent": "TD3"}, {"env_step": 805000, "rew": 3659.0503, "rew_std": 441.8842, "Agent": "TD3"}, {"env_step": 810000, "rew": 3848.2124, "rew_std": 338.7611, "Agent": "TD3"}, {"env_step": 815000, "rew": 3788.2873, "rew_std": 352.9827, "Agent": "TD3"}, {"env_step": 820000, "rew": 3676.1377, "rew_std": 447.1038, "Agent": "TD3"}, {"env_step": 825000, "rew": 3655.8464, "rew_std": 500.1373, "Agent": "TD3"}, {"env_step": 830000, "rew": 3661.1425, "rew_std": 474.9795, "Agent": "TD3"}, {"env_step": 835000, "rew": 3761.5947, "rew_std": 454.3814, "Agent": "TD3"}, {"env_step": 840000, "rew": 3547.5446, "rew_std": 649.1363, "Agent": "TD3"}, {"env_step": 845000, "rew": 3782.9667, "rew_std": 393.4763, "Agent": "TD3"}, {"env_step": 850000, "rew": 3826.4287, "rew_std": 434.9649, "Agent": "TD3"}, {"env_step": 855000, "rew": 3852.4662, "rew_std": 320.955, "Agent": "TD3"}, {"env_step": 860000, "rew": 3809.3982, "rew_std": 392.2426, "Agent": "TD3"}, {"env_step": 865000, "rew": 3922.2025, "rew_std": 301.9907, "Agent": "TD3"}, {"env_step": 870000, "rew": 3897.4311, "rew_std": 291.2018, "Agent": "TD3"}, {"env_step": 875000, "rew": 3854.7866, "rew_std": 308.0508, "Agent": "TD3"}, {"env_step": 880000, "rew": 3933.806, "rew_std": 249.8089, "Agent": "TD3"}, {"env_step": 885000, "rew": 3901.5901, "rew_std": 312.7858, "Agent": "TD3"}, {"env_step": 890000, "rew": 3801.9979, "rew_std": 403.794, "Agent": "TD3"}, {"env_step": 895000, "rew": 3867.7087, "rew_std": 321.1295, "Agent": "TD3"}, {"env_step": 900000, "rew": 3822.249, "rew_std": 238.2393, "Agent": "TD3"}, {"env_step": 905000, "rew": 3964.0144, "rew_std": 256.6233, "Agent": "TD3"}, {"env_step": 910000, "rew": 3872.3271, "rew_std": 358.6703, "Agent": "TD3"}, {"env_step": 915000, "rew": 3618.269, "rew_std": 689.9244, "Agent": "TD3"}, {"env_step": 920000, "rew": 3654.5516, "rew_std": 589.5807, "Agent": "TD3"}, {"env_step": 925000, "rew": 3726.6865, "rew_std": 570.2878, "Agent": "TD3"}, {"env_step": 930000, "rew": 3660.1793, "rew_std": 822.526, "Agent": "TD3"}, {"env_step": 935000, "rew": 3924.3608, "rew_std": 309.0233, "Agent": "TD3"}, {"env_step": 940000, "rew": 3869.3083, "rew_std": 345.4325, "Agent": "TD3"}, {"env_step": 945000, "rew": 3956.3273, "rew_std": 279.5054, "Agent": "TD3"}, {"env_step": 950000, "rew": 3886.109, "rew_std": 314.0698, "Agent": "TD3"}, {"env_step": 955000, "rew": 3887.0205, "rew_std": 341.8582, "Agent": "TD3"}, {"env_step": 960000, "rew": 3709.4522, "rew_std": 516.5253, "Agent": "TD3"}, {"env_step": 965000, "rew": 3929.1202, "rew_std": 353.7442, "Agent": "TD3"}, {"env_step": 970000, "rew": 3911.8695, "rew_std": 371.1694, "Agent": "TD3"}, {"env_step": 975000, "rew": 3908.5383, "rew_std": 361.4298, "Agent": "TD3"}, {"env_step": 980000, "rew": 3859.852, "rew_std": 417.185, "Agent": "TD3"}, {"env_step": 985000, "rew": 3982.3984, "rew_std": 274.5322, "Agent": "TD3"}, {"env_step": 990000, "rew": 3958.8785, "rew_std": 290.6377, "Agent": "TD3"}, {"env_step": 995000, "rew": 3963.8609, "rew_std": 286.8225, "Agent": "TD3"}, {"env_step": 1000000, "rew": 3842.4794, "rew_std": 542.842, "Agent": "TD3"}, {"env_step": 1005000, "rew": 3974.7944, "rew_std": 309.055, "Agent": "TD3"}, {"env_step": 1010000, "rew": 4003.5151, "rew_std": 263.8881, "Agent": "TD3"}, {"env_step": 1015000, "rew": 3983.979, "rew_std": 334.1982, "Agent": "TD3"}, {"env_step": 1020000, "rew": 3935.9096, "rew_std": 310.9028, "Agent": "TD3"}, {"env_step": 1025000, "rew": 3965.1715, "rew_std": 260.2935, "Agent": "TD3"}, {"env_step": 1030000, "rew": 3957.0111, "rew_std": 289.9182, "Agent": "TD3"}, {"env_step": 1035000, "rew": 3953.037, "rew_std": 289.5479, "Agent": "TD3"}, {"env_step": 1040000, "rew": 3947.6777, "rew_std": 317.5802, "Agent": "TD3"}, {"env_step": 1045000, "rew": 3965.4811, "rew_std": 313.9896, "Agent": "TD3"}, {"env_step": 1050000, "rew": 3981.0784, "rew_std": 260.7073, "Agent": "TD3"}, {"env_step": 1055000, "rew": 3969.5636, "rew_std": 285.3478, "Agent": "TD3"}, {"env_step": 1060000, "rew": 3870.8374, "rew_std": 380.1209, "Agent": "TD3"}, {"env_step": 1065000, "rew": 3962.4485, "rew_std": 329.861, "Agent": "TD3"}, {"env_step": 1070000, "rew": 3966.8242, "rew_std": 308.1006, "Agent": "TD3"}, {"env_step": 1075000, "rew": 3760.9236, "rew_std": 612.3897, "Agent": "TD3"}, {"env_step": 1080000, "rew": 3904.4641, "rew_std": 148.3606, "Agent": "TD3"}, {"env_step": 1085000, "rew": 4023.2404, "rew_std": 308.8932, "Agent": "TD3"}, {"env_step": 1090000, "rew": 3983.7184, "rew_std": 358.6709, "Agent": "TD3"}, {"env_step": 1095000, "rew": 3818.5878, "rew_std": 671.8452, "Agent": "TD3"}, {"env_step": 1100000, "rew": 3565.3794, "rew_std": 980.5895, "Agent": "TD3"}, {"env_step": 1105000, "rew": 3992.6244, "rew_std": 344.5732, "Agent": "TD3"}, {"env_step": 1110000, "rew": 4021.0643, "rew_std": 278.6346, "Agent": "TD3"}, {"env_step": 1115000, "rew": 4055.4366, "rew_std": 245.4637, "Agent": "TD3"}, {"env_step": 1120000, "rew": 4059.6238, "rew_std": 278.8573, "Agent": "TD3"}, {"env_step": 1125000, "rew": 4077.0175, "rew_std": 286.7732, "Agent": "TD3"}, {"env_step": 1130000, "rew": 4045.8937, "rew_std": 311.3991, "Agent": "TD3"}, {"env_step": 1135000, "rew": 3912.0977, "rew_std": 395.9068, "Agent": "TD3"}, {"env_step": 1140000, "rew": 4025.0121, "rew_std": 331.3458, "Agent": "TD3"}, {"env_step": 1145000, "rew": 3989.2987, "rew_std": 464.5883, "Agent": "TD3"}, {"env_step": 1150000, "rew": 3997.7196, "rew_std": 347.4466, "Agent": "TD3"}, {"env_step": 1155000, "rew": 3773.2647, "rew_std": 761.1243, "Agent": "TD3"}, {"env_step": 1160000, "rew": 3804.4806, "rew_std": 809.5976, "Agent": "TD3"}, {"env_step": 1165000, "rew": 3905.1056, "rew_std": 407.3495, "Agent": "TD3"}, {"env_step": 1170000, "rew": 3871.2903, "rew_std": 540.1013, "Agent": "TD3"}, {"env_step": 1175000, "rew": 4088.6869, "rew_std": 261.6677, "Agent": "TD3"}, {"env_step": 1180000, "rew": 4060.7687, "rew_std": 303.4577, "Agent": "TD3"}, {"env_step": 1185000, "rew": 3922.0452, "rew_std": 467.9461, "Agent": "TD3"}, {"env_step": 1190000, "rew": 3998.1894, "rew_std": 328.7816, "Agent": "TD3"}, {"env_step": 1195000, "rew": 4083.5345, "rew_std": 278.3686, "Agent": "TD3"}, {"env_step": 1200000, "rew": 4076.6858, "rew_std": 288.7971, "Agent": "TD3"}, {"env_step": 1205000, "rew": 3645.9029, "rew_std": 1259.4616, "Agent": "TD3"}, {"env_step": 1210000, "rew": 4022.6485, "rew_std": 257.4678, "Agent": "TD3"}, {"env_step": 1215000, "rew": 4099.1548, "rew_std": 286.4948, "Agent": "TD3"}, {"env_step": 1220000, "rew": 3926.8921, "rew_std": 500.0917, "Agent": "TD3"}, {"env_step": 1225000, "rew": 4029.5039, "rew_std": 379.5839, "Agent": "TD3"}, {"env_step": 1230000, "rew": 4072.0896, "rew_std": 319.4776, "Agent": "TD3"}, {"env_step": 1235000, "rew": 4008.971, "rew_std": 424.1579, "Agent": "TD3"}, {"env_step": 1240000, "rew": 4100.0992, "rew_std": 353.1118, "Agent": "TD3"}, {"env_step": 1245000, "rew": 4101.0508, "rew_std": 312.8775, "Agent": "TD3"}, {"env_step": 1250000, "rew": 3763.9407, "rew_std": 947.9912, "Agent": "TD3"}, {"env_step": 0, "rew": 4.5535, "rew_std": 2.0756, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 13.6527, "rew_std": 5.6565, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 110.1682, "rew_std": 59.6794, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 223.5316, "rew_std": 29.8609, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 200.5065, "rew_std": 39.9608, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 187.5621, "rew_std": 34.827, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 235.2624, "rew_std": 32.9012, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 239.778, "rew_std": 33.4927, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 247.0896, "rew_std": 29.8488, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 258.3275, "rew_std": 29.6617, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 266.5922, "rew_std": 30.4123, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 295.2816, "rew_std": 50.3467, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 292.9666, "rew_std": 42.0559, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 299.5063, "rew_std": 38.3164, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 271.3942, "rew_std": 46.1242, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 296.9937, "rew_std": 54.9201, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 284.61, "rew_std": 59.2053, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 323.922, "rew_std": 54.241, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 325.3197, "rew_std": 57.678, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 309.106, "rew_std": 53.6707, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 340.3094, "rew_std": 54.4306, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 322.4308, "rew_std": 66.5441, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 359.9286, "rew_std": 46.8059, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 355.6872, "rew_std": 60.0439, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 354.6147, "rew_std": 39.4527, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 342.5682, "rew_std": 35.7644, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 385.1629, "rew_std": 48.8126, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 391.1747, "rew_std": 44.5626, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 346.6364, "rew_std": 65.094, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 353.0954, "rew_std": 69.2847, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 346.909, "rew_std": 62.2388, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 367.5316, "rew_std": 60.5551, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 354.1843, "rew_std": 63.154, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 343.4204, "rew_std": 55.6947, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 354.1547, "rew_std": 97.6597, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 403.1631, "rew_std": 76.9285, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 381.1449, "rew_std": 80.7015, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 372.1611, "rew_std": 84.8949, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 339.0372, "rew_std": 72.4904, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 357.2748, "rew_std": 57.2974, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 355.9174, "rew_std": 80.0236, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 353.4319, "rew_std": 64.1911, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 373.0621, "rew_std": 92.4906, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 341.2523, "rew_std": 77.9283, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 348.859, "rew_std": 60.7955, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 355.2645, "rew_std": 77.5044, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 356.7775, "rew_std": 88.4894, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 329.7672, "rew_std": 67.3729, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 335.196, "rew_std": 94.2459, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 356.1628, "rew_std": 75.7139, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 352.1588, "rew_std": 71.9885, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 361.1192, "rew_std": 62.3489, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 352.0869, "rew_std": 69.1096, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 344.9398, "rew_std": 61.5555, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 371.1304, "rew_std": 78.2817, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 356.5322, "rew_std": 118.4185, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 370.873, "rew_std": 86.1696, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 361.6152, "rew_std": 85.3641, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 366.3599, "rew_std": 82.2322, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 367.3329, "rew_std": 80.3721, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 362.9224, "rew_std": 86.4875, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 388.4115, "rew_std": 80.8852, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 352.6121, "rew_std": 89.2546, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 354.0444, "rew_std": 105.3851, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 371.3243, "rew_std": 87.666, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 365.3113, "rew_std": 103.0233, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 355.7672, "rew_std": 90.9894, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 338.4174, "rew_std": 87.8862, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 362.839, "rew_std": 92.0007, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 368.269, "rew_std": 102.4378, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 373.8035, "rew_std": 87.1727, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 361.1823, "rew_std": 78.0693, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 367.1892, "rew_std": 102.8876, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 365.9658, "rew_std": 81.4782, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 360.6872, "rew_std": 114.0468, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 365.9783, "rew_std": 122.2242, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 379.9675, "rew_std": 81.0374, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 345.6967, "rew_std": 87.0767, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 366.1253, "rew_std": 105.243, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 352.4197, "rew_std": 74.3958, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 380.5138, "rew_std": 77.7426, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 367.3545, "rew_std": 109.7126, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 369.4047, "rew_std": 88.9617, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 355.9494, "rew_std": 84.9406, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 361.6388, "rew_std": 77.2025, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 385.6433, "rew_std": 56.6485, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 383.2675, "rew_std": 59.8544, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 383.3281, "rew_std": 53.5628, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 380.186, "rew_std": 51.4936, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 357.4304, "rew_std": 92.4873, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 372.8371, "rew_std": 62.6374, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 369.476, "rew_std": 93.6221, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 377.2572, "rew_std": 53.0474, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 387.0054, "rew_std": 83.6139, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 411.9642, "rew_std": 52.4265, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 377.7804, "rew_std": 61.193, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 393.2933, "rew_std": 47.9778, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 376.6218, "rew_std": 34.4225, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 402.7766, "rew_std": 51.016, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 397.0908, "rew_std": 52.792, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 367.9954, "rew_std": 50.4738, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 393.0217, "rew_std": 40.7415, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 382.9788, "rew_std": 73.7203, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 392.1084, "rew_std": 80.7669, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 368.0044, "rew_std": 109.1821, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 365.6822, "rew_std": 102.6338, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 382.1389, "rew_std": 90.5947, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 369.5934, "rew_std": 119.2678, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 393.8103, "rew_std": 75.0153, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 395.4096, "rew_std": 55.3204, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 397.228, "rew_std": 45.0803, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 375.64, "rew_std": 70.8521, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 365.7149, "rew_std": 95.5683, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 403.0538, "rew_std": 87.3548, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 380.4232, "rew_std": 69.2007, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 365.7752, "rew_std": 60.142, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 412.5866, "rew_std": 75.7224, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 381.8078, "rew_std": 49.9293, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 365.5222, "rew_std": 71.6263, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 377.7163, "rew_std": 91.3498, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 383.1321, "rew_std": 85.0593, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 383.9464, "rew_std": 66.19, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 385.9448, "rew_std": 67.9891, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 400.476, "rew_std": 72.4173, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 388.3522, "rew_std": 75.5529, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 370.6014, "rew_std": 51.1635, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 375.0117, "rew_std": 51.0137, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 379.3578, "rew_std": 86.254, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 344.8633, "rew_std": 88.2011, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 374.3863, "rew_std": 95.5118, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 365.4688, "rew_std": 36.3682, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 366.4785, "rew_std": 71.8855, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 391.0318, "rew_std": 87.9838, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 381.0298, "rew_std": 134.4287, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 376.8203, "rew_std": 122.3133, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 385.0486, "rew_std": 122.6676, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 392.2119, "rew_std": 84.2356, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 390.4859, "rew_std": 102.2499, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 375.6258, "rew_std": 86.9314, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 360.4221, "rew_std": 83.6774, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 391.1976, "rew_std": 126.0342, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 400.9994, "rew_std": 130.515, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 390.3708, "rew_std": 130.4103, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 418.1074, "rew_std": 143.7854, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 389.2711, "rew_std": 127.9304, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 400.3435, "rew_std": 93.977, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 392.0837, "rew_std": 70.1953, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 384.8207, "rew_std": 52.8932, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 388.1618, "rew_std": 70.1572, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 404.4836, "rew_std": 32.4901, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 369.5814, "rew_std": 48.7199, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 389.792, "rew_std": 71.4531, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 398.5943, "rew_std": 44.3371, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 402.502, "rew_std": 96.5453, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 396.9333, "rew_std": 91.251, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 417.5429, "rew_std": 78.3296, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 387.9348, "rew_std": 104.9392, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 380.8827, "rew_std": 73.3557, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 373.8808, "rew_std": 85.8424, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 407.9777, "rew_std": 105.0307, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 402.8455, "rew_std": 66.1868, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 404.205, "rew_std": 58.5461, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 386.6169, "rew_std": 125.2089, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 408.7262, "rew_std": 123.4934, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 408.2545, "rew_std": 86.5406, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 388.8189, "rew_std": 52.579, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 394.7104, "rew_std": 99.5027, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 401.2406, "rew_std": 136.2089, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 398.7414, "rew_std": 79.958, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 373.4073, "rew_std": 77.1063, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 393.8529, "rew_std": 43.3438, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 401.865, "rew_std": 102.3126, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 380.1387, "rew_std": 54.8124, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 387.9333, "rew_std": 86.9538, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 415.7576, "rew_std": 97.4606, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 411.729, "rew_std": 39.4573, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 385.0198, "rew_std": 43.8433, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 407.4051, "rew_std": 40.8758, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 386.1591, "rew_std": 76.381, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 376.209, "rew_std": 59.3498, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 374.4433, "rew_std": 65.4441, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 381.2189, "rew_std": 52.3455, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 400.3018, "rew_std": 52.0294, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 365.557, "rew_std": 72.3095, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 385.0313, "rew_std": 59.146, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 397.3092, "rew_std": 82.9393, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 379.5796, "rew_std": 92.9322, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 369.3897, "rew_std": 82.5958, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 375.9339, "rew_std": 65.9221, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 385.4407, "rew_std": 49.7583, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 358.2405, "rew_std": 76.576, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 379.1335, "rew_std": 85.8798, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 390.6354, "rew_std": 55.6648, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 407.4857, "rew_std": 53.7845, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 389.4891, "rew_std": 62.8058, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 378.5658, "rew_std": 85.5362, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 421.8988, "rew_std": 90.1603, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 391.6838, "rew_std": 84.9852, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 396.7111, "rew_std": 93.5643, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 402.8608, "rew_std": 80.8142, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 391.1558, "rew_std": 99.2084, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 380.1508, "rew_std": 96.9348, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 398.3499, "rew_std": 71.4008, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 393.8231, "rew_std": 67.8702, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 370.8872, "rew_std": 85.2826, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 434.32, "rew_std": 85.2785, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 377.7296, "rew_std": 127.8071, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 375.258, "rew_std": 131.5744, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 380.6274, "rew_std": 100.9078, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 395.2915, "rew_std": 96.0091, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 415.9735, "rew_std": 144.4578, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 388.7657, "rew_std": 98.0722, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 410.147, "rew_std": 121.3785, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 420.5058, "rew_std": 143.5157, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 381.8966, "rew_std": 117.6944, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 380.0762, "rew_std": 107.2386, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 389.8562, "rew_std": 143.3065, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 390.21, "rew_std": 106.5489, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 440.9279, "rew_std": 148.2265, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 401.6778, "rew_std": 126.5315, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 406.0223, "rew_std": 116.1778, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 359.3388, "rew_std": 81.5517, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 402.2027, "rew_std": 128.0781, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 375.5144, "rew_std": 100.1, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 370.0802, "rew_std": 94.1041, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 387.4542, "rew_std": 58.9515, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 392.3885, "rew_std": 113.2836, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 384.8551, "rew_std": 105.257, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 392.4603, "rew_std": 131.9155, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 373.492, "rew_std": 90.3701, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 369.7354, "rew_std": 118.7059, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 398.9831, "rew_std": 57.4786, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 366.8138, "rew_std": 101.1937, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 385.3933, "rew_std": 115.2182, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 363.0968, "rew_std": 106.2384, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 364.1249, "rew_std": 132.2329, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 386.8129, "rew_std": 106.5349, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 361.4476, "rew_std": 92.2265, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 367.8644, "rew_std": 76.1768, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 372.2277, "rew_std": 61.5203, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 383.5695, "rew_std": 65.289, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 376.8635, "rew_std": 111.4057, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 364.5879, "rew_std": 100.5854, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 368.2759, "rew_std": 99.9324, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 381.457, "rew_std": 92.2431, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 351.8763, "rew_std": 132.2134, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 383.2411, "rew_std": 74.2994, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 350.1911, "rew_std": 92.5451, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 363.1767, "rew_std": 88.2368, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 382.3549, "rew_std": 132.6238, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 359.9137, "rew_std": 101.0479, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 367.2583, "rew_std": 101.4204, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 343.4797, "rew_std": 113.3278, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 357.4038, "rew_std": 120.2726, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 371.3363, "rew_std": 68.6317, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 380.6468, "rew_std": 62.7897, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 364.0078, "rew_std": 102.1884, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 390.4208, "rew_std": 64.8, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 367.6176, "rew_std": 57.5819, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 374.8038, "rew_std": 75.8725, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 372.3415, "rew_std": 75.1058, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 364.4274, "rew_std": 126.2467, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 333.2996, "rew_std": 100.0399, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 347.481, "rew_std": 100.2056, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 370.4996, "rew_std": 95.8974, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 374.8886, "rew_std": 118.6889, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 379.4134, "rew_std": 118.8234, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 383.0012, "rew_std": 64.9941, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 375.0866, "rew_std": 89.8378, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 375.1638, "rew_std": 101.1116, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 385.6165, "rew_std": 69.0373, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 375.2498, "rew_std": 104.7292, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 402.2431, "rew_std": 79.0858, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 382.6706, "rew_std": 91.6997, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 372.3715, "rew_std": 82.5468, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 401.3655, "rew_std": 98.7974, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 385.1743, "rew_std": 58.1178, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 375.3559, "rew_std": 104.8732, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 349.357, "rew_std": 93.2866, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 376.5432, "rew_std": 69.9092, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 382.909, "rew_std": 65.2545, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 377.8138, "rew_std": 87.565, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 383.207, "rew_std": 80.1754, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 371.4133, "rew_std": 89.9161, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 376.919, "rew_std": 69.2769, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 379.47, "rew_std": 76.5879, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 366.7001, "rew_std": 104.0949, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 382.4882, "rew_std": 62.5922, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 372.0743, "rew_std": 79.0617, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 357.0979, "rew_std": 101.0783, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 402.782, "rew_std": 73.662, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 383.05, "rew_std": 95.7289, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 398.7126, "rew_std": 49.3771, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 342.6036, "rew_std": 102.5794, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 393.9359, "rew_std": 55.8315, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 358.2121, "rew_std": 98.775, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 396.7736, "rew_std": 47.5404, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 390.0685, "rew_std": 64.218, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 367.538, "rew_std": 85.9344, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 367.0394, "rew_std": 96.7543, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 365.089, "rew_std": 97.8226, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 394.2243, "rew_std": 83.5708, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 374.55, "rew_std": 118.3468, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 349.5582, "rew_std": 95.0112, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 370.6759, "rew_std": 67.2228, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 386.7887, "rew_std": 83.2882, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 374.7842, "rew_std": 83.7501, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 382.3645, "rew_std": 79.8977, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 359.2723, "rew_std": 106.1609, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 411.7006, "rew_std": 32.7818, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 381.7046, "rew_std": 82.238, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 395.8383, "rew_std": 52.7248, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 382.9098, "rew_std": 64.35, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 374.4013, "rew_std": 104.142, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 380.0431, "rew_std": 80.4186, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 380.1886, "rew_std": 81.4481, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 363.2701, "rew_std": 86.7719, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 373.5595, "rew_std": 72.1207, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 384.6104, "rew_std": 71.9801, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 375.595, "rew_std": 63.4577, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 360.9498, "rew_std": 73.2914, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 378.3045, "rew_std": 68.1014, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 377.6049, "rew_std": 65.1815, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 377.4226, "rew_std": 79.2419, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 371.0989, "rew_std": 69.7, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 395.0888, "rew_std": 64.5988, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 380.6971, "rew_std": 66.6752, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 369.8089, "rew_std": 82.7607, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 359.9013, "rew_std": 90.9538, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 369.0725, "rew_std": 62.3956, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 392.5896, "rew_std": 50.2816, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 361.0641, "rew_std": 109.9217, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 352.6764, "rew_std": 79.7465, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 352.3748, "rew_std": 82.8586, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 6.442, "rew_std": 12.7772, "Agent": "SAC"}, {"env_step": 5000, "rew": 384.2125, "rew_std": 91.1295, "Agent": "SAC"}, {"env_step": 10000, "rew": 311.4904, "rew_std": 92.4643, "Agent": "SAC"}, {"env_step": 15000, "rew": 341.5975, "rew_std": 61.666, "Agent": "SAC"}, {"env_step": 20000, "rew": 332.6649, "rew_std": 99.9772, "Agent": "SAC"}, {"env_step": 25000, "rew": 381.5184, "rew_std": 156.4263, "Agent": "SAC"}, {"env_step": 30000, "rew": 396.9952, "rew_std": 101.5131, "Agent": "SAC"}, {"env_step": 35000, "rew": 428.0762, "rew_std": 112.466, "Agent": "SAC"}, {"env_step": 40000, "rew": 538.719, "rew_std": 425.0536, "Agent": "SAC"}, {"env_step": 45000, "rew": 613.2465, "rew_std": 440.9208, "Agent": "SAC"}, {"env_step": 50000, "rew": 695.3813, "rew_std": 413.9007, "Agent": "SAC"}, {"env_step": 55000, "rew": 867.3111, "rew_std": 429.0798, "Agent": "SAC"}, {"env_step": 60000, "rew": 821.5923, "rew_std": 626.4058, "Agent": "SAC"}, {"env_step": 65000, "rew": 724.8063, "rew_std": 548.7352, "Agent": "SAC"}, {"env_step": 70000, "rew": 869.673, "rew_std": 605.068, "Agent": "SAC"}, {"env_step": 75000, "rew": 887.8157, "rew_std": 670.5667, "Agent": "SAC"}, {"env_step": 80000, "rew": 842.7084, "rew_std": 595.3462, "Agent": "SAC"}, {"env_step": 85000, "rew": 934.1402, "rew_std": 445.0447, "Agent": "SAC"}, {"env_step": 90000, "rew": 843.5223, "rew_std": 707.1264, "Agent": "SAC"}, {"env_step": 95000, "rew": 1145.929, "rew_std": 693.5426, "Agent": "SAC"}, {"env_step": 100000, "rew": 1305.246, "rew_std": 795.0855, "Agent": "SAC"}, {"env_step": 105000, "rew": 982.3865, "rew_std": 559.6456, "Agent": "SAC"}, {"env_step": 110000, "rew": 1438.316, "rew_std": 897.6387, "Agent": "SAC"}, {"env_step": 115000, "rew": 1684.2845, "rew_std": 980.9338, "Agent": "SAC"}, {"env_step": 120000, "rew": 1576.6348, "rew_std": 973.7348, "Agent": "SAC"}, {"env_step": 125000, "rew": 1635.8776, "rew_std": 1040.758, "Agent": "SAC"}, {"env_step": 130000, "rew": 1260.5658, "rew_std": 771.0769, "Agent": "SAC"}, {"env_step": 135000, "rew": 1870.8694, "rew_std": 948.5044, "Agent": "SAC"}, {"env_step": 140000, "rew": 1804.7263, "rew_std": 1012.1946, "Agent": "SAC"}, {"env_step": 145000, "rew": 1733.9893, "rew_std": 1143.5478, "Agent": "SAC"}, {"env_step": 150000, "rew": 1981.0082, "rew_std": 1216.2987, "Agent": "SAC"}, {"env_step": 155000, "rew": 2061.6254, "rew_std": 1290.993, "Agent": "SAC"}, {"env_step": 160000, "rew": 2199.765, "rew_std": 1182.4863, "Agent": "SAC"}, {"env_step": 165000, "rew": 2295.9367, "rew_std": 1338.0812, "Agent": "SAC"}, {"env_step": 170000, "rew": 2374.0511, "rew_std": 1184.7679, "Agent": "SAC"}, {"env_step": 175000, "rew": 2230.0855, "rew_std": 1255.8343, "Agent": "SAC"}, {"env_step": 180000, "rew": 2253.6271, "rew_std": 1346.9405, "Agent": "SAC"}, {"env_step": 185000, "rew": 2155.7215, "rew_std": 1412.9678, "Agent": "SAC"}, {"env_step": 190000, "rew": 2449.8378, "rew_std": 1421.6176, "Agent": "SAC"}, {"env_step": 195000, "rew": 1713.5455, "rew_std": 1319.3, "Agent": "SAC"}, {"env_step": 200000, "rew": 2530.5179, "rew_std": 1300.063, "Agent": "SAC"}, {"env_step": 205000, "rew": 2560.3269, "rew_std": 1206.713, "Agent": "SAC"}, {"env_step": 210000, "rew": 2608.8807, "rew_std": 1516.2121, "Agent": "SAC"}, {"env_step": 215000, "rew": 2940.6585, "rew_std": 1263.8721, "Agent": "SAC"}, {"env_step": 220000, "rew": 2835.1198, "rew_std": 1313.7764, "Agent": "SAC"}, {"env_step": 225000, "rew": 2795.9974, "rew_std": 1438.7164, "Agent": "SAC"}, {"env_step": 230000, "rew": 2982.4341, "rew_std": 1106.1144, "Agent": "SAC"}, {"env_step": 235000, "rew": 3005.3469, "rew_std": 1261.5498, "Agent": "SAC"}, {"env_step": 240000, "rew": 2919.6294, "rew_std": 1372.1881, "Agent": "SAC"}, {"env_step": 245000, "rew": 3230.0246, "rew_std": 964.7996, "Agent": "SAC"}, {"env_step": 250000, "rew": 3057.256, "rew_std": 1279.675, "Agent": "SAC"}, {"env_step": 255000, "rew": 2914.3693, "rew_std": 1492.3339, "Agent": "SAC"}, {"env_step": 260000, "rew": 3260.669, "rew_std": 1081.3091, "Agent": "SAC"}, {"env_step": 265000, "rew": 3395.4337, "rew_std": 1115.2453, "Agent": "SAC"}, {"env_step": 270000, "rew": 3382.5232, "rew_std": 1198.3392, "Agent": "SAC"}, {"env_step": 275000, "rew": 3343.9861, "rew_std": 1189.3488, "Agent": "SAC"}, {"env_step": 280000, "rew": 3486.7607, "rew_std": 1027.7273, "Agent": "SAC"}, {"env_step": 285000, "rew": 3407.4401, "rew_std": 1093.805, "Agent": "SAC"}, {"env_step": 290000, "rew": 3582.8111, "rew_std": 1225.0489, "Agent": "SAC"}, {"env_step": 295000, "rew": 3561.0796, "rew_std": 1143.1364, "Agent": "SAC"}, {"env_step": 300000, "rew": 3386.777, "rew_std": 1182.0262, "Agent": "SAC"}, {"env_step": 305000, "rew": 3227.8796, "rew_std": 1305.9756, "Agent": "SAC"}, {"env_step": 310000, "rew": 3755.7218, "rew_std": 908.9631, "Agent": "SAC"}, {"env_step": 315000, "rew": 3697.4154, "rew_std": 1144.1577, "Agent": "SAC"}, {"env_step": 320000, "rew": 3523.1265, "rew_std": 1185.8277, "Agent": "SAC"}, {"env_step": 325000, "rew": 3865.0648, "rew_std": 734.798, "Agent": "SAC"}, {"env_step": 330000, "rew": 3436.0228, "rew_std": 1121.3988, "Agent": "SAC"}, {"env_step": 335000, "rew": 3778.7621, "rew_std": 779.3629, "Agent": "SAC"}, {"env_step": 340000, "rew": 3853.8889, "rew_std": 784.8108, "Agent": "SAC"}, {"env_step": 345000, "rew": 3567.5159, "rew_std": 841.2435, "Agent": "SAC"}, {"env_step": 350000, "rew": 4101.7505, "rew_std": 448.9228, "Agent": "SAC"}, {"env_step": 355000, "rew": 4027.0011, "rew_std": 704.9953, "Agent": "SAC"}, {"env_step": 360000, "rew": 4103.7433, "rew_std": 525.8276, "Agent": "SAC"}, {"env_step": 365000, "rew": 4173.6105, "rew_std": 505.5541, "Agent": "SAC"}, {"env_step": 370000, "rew": 4149.5763, "rew_std": 724.6827, "Agent": "SAC"}, {"env_step": 375000, "rew": 3942.1668, "rew_std": 843.3023, "Agent": "SAC"}, {"env_step": 380000, "rew": 4152.364, "rew_std": 435.6519, "Agent": "SAC"}, {"env_step": 385000, "rew": 4189.1143, "rew_std": 475.1204, "Agent": "SAC"}, {"env_step": 390000, "rew": 4311.4203, "rew_std": 338.2765, "Agent": "SAC"}, {"env_step": 395000, "rew": 4218.0714, "rew_std": 346.1174, "Agent": "SAC"}, {"env_step": 400000, "rew": 4289.7702, "rew_std": 345.5157, "Agent": "SAC"}, {"env_step": 405000, "rew": 4251.2825, "rew_std": 417.9483, "Agent": "SAC"}, {"env_step": 410000, "rew": 4334.316, "rew_std": 352.4353, "Agent": "SAC"}, {"env_step": 415000, "rew": 4291.9864, "rew_std": 328.9922, "Agent": "SAC"}, {"env_step": 420000, "rew": 4333.559, "rew_std": 412.5937, "Agent": "SAC"}, {"env_step": 425000, "rew": 3895.0666, "rew_std": 1285.4803, "Agent": "SAC"}, {"env_step": 430000, "rew": 4089.7339, "rew_std": 976.8529, "Agent": "SAC"}, {"env_step": 435000, "rew": 4322.8754, "rew_std": 494.2115, "Agent": "SAC"}, {"env_step": 440000, "rew": 4158.0765, "rew_std": 714.8891, "Agent": "SAC"}, {"env_step": 445000, "rew": 4307.1994, "rew_std": 545.6213, "Agent": "SAC"}, {"env_step": 450000, "rew": 4471.6417, "rew_std": 460.2717, "Agent": "SAC"}, {"env_step": 455000, "rew": 4451.7838, "rew_std": 336.7615, "Agent": "SAC"}, {"env_step": 460000, "rew": 4250.6242, "rew_std": 760.2981, "Agent": "SAC"}, {"env_step": 465000, "rew": 4348.7151, "rew_std": 326.842, "Agent": "SAC"}, {"env_step": 470000, "rew": 4303.0926, "rew_std": 502.9855, "Agent": "SAC"}, {"env_step": 475000, "rew": 4474.3392, "rew_std": 296.9774, "Agent": "SAC"}, {"env_step": 480000, "rew": 4466.7216, "rew_std": 357.6031, "Agent": "SAC"}, {"env_step": 485000, "rew": 4525.9658, "rew_std": 351.0915, "Agent": "SAC"}, {"env_step": 490000, "rew": 4519.1572, "rew_std": 342.3496, "Agent": "SAC"}, {"env_step": 495000, "rew": 4336.2845, "rew_std": 617.5122, "Agent": "SAC"}, {"env_step": 500000, "rew": 4572.7087, "rew_std": 337.2333, "Agent": "SAC"}, {"env_step": 505000, "rew": 4469.0437, "rew_std": 301.8515, "Agent": "SAC"}, {"env_step": 510000, "rew": 4458.5882, "rew_std": 421.4234, "Agent": "SAC"}, {"env_step": 515000, "rew": 4375.1096, "rew_std": 746.4311, "Agent": "SAC"}, {"env_step": 520000, "rew": 3986.7109, "rew_std": 1411.5229, "Agent": "SAC"}, {"env_step": 525000, "rew": 3944.5748, "rew_std": 1475.4799, "Agent": "SAC"}, {"env_step": 530000, "rew": 4416.7452, "rew_std": 427.131, "Agent": "SAC"}, {"env_step": 535000, "rew": 4592.5295, "rew_std": 308.1874, "Agent": "SAC"}, {"env_step": 540000, "rew": 4173.1087, "rew_std": 1166.0453, "Agent": "SAC"}, {"env_step": 545000, "rew": 4636.8842, "rew_std": 286.4875, "Agent": "SAC"}, {"env_step": 550000, "rew": 4578.3448, "rew_std": 302.9395, "Agent": "SAC"}, {"env_step": 555000, "rew": 4413.4363, "rew_std": 685.7219, "Agent": "SAC"}, {"env_step": 560000, "rew": 4584.8782, "rew_std": 372.8659, "Agent": "SAC"}, {"env_step": 565000, "rew": 4636.6749, "rew_std": 284.3277, "Agent": "SAC"}, {"env_step": 570000, "rew": 4317.3934, "rew_std": 860.2242, "Agent": "SAC"}, {"env_step": 575000, "rew": 4374.3222, "rew_std": 1105.2963, "Agent": "SAC"}, {"env_step": 580000, "rew": 4571.8318, "rew_std": 298.5848, "Agent": "SAC"}, {"env_step": 585000, "rew": 4632.2289, "rew_std": 310.1531, "Agent": "SAC"}, {"env_step": 590000, "rew": 4511.29, "rew_std": 467.326, "Agent": "SAC"}, {"env_step": 595000, "rew": 4607.8163, "rew_std": 331.9071, "Agent": "SAC"}, {"env_step": 600000, "rew": 4323.4754, "rew_std": 781.4137, "Agent": "SAC"}, {"env_step": 605000, "rew": 4671.2125, "rew_std": 285.3162, "Agent": "SAC"}, {"env_step": 610000, "rew": 4643.3239, "rew_std": 344.1169, "Agent": "SAC"}, {"env_step": 615000, "rew": 4690.2549, "rew_std": 282.8784, "Agent": "SAC"}, {"env_step": 620000, "rew": 4686.0131, "rew_std": 369.3955, "Agent": "SAC"}, {"env_step": 625000, "rew": 4688.8255, "rew_std": 324.6271, "Agent": "SAC"}, {"env_step": 630000, "rew": 4506.0534, "rew_std": 567.9693, "Agent": "SAC"}, {"env_step": 635000, "rew": 4606.6157, "rew_std": 325.8416, "Agent": "SAC"}, {"env_step": 640000, "rew": 4673.6359, "rew_std": 304.2885, "Agent": "SAC"}, {"env_step": 645000, "rew": 4624.5667, "rew_std": 273.8858, "Agent": "SAC"}, {"env_step": 650000, "rew": 4723.6719, "rew_std": 298.1089, "Agent": "SAC"}, {"env_step": 655000, "rew": 4753.7342, "rew_std": 243.8481, "Agent": "SAC"}, {"env_step": 660000, "rew": 4585.5831, "rew_std": 438.7594, "Agent": "SAC"}, {"env_step": 665000, "rew": 4783.7243, "rew_std": 288.8173, "Agent": "SAC"}, {"env_step": 670000, "rew": 4760.5305, "rew_std": 216.8594, "Agent": "SAC"}, {"env_step": 675000, "rew": 4745.5199, "rew_std": 292.853, "Agent": "SAC"}, {"env_step": 680000, "rew": 4754.3869, "rew_std": 299.4585, "Agent": "SAC"}, {"env_step": 685000, "rew": 4797.6591, "rew_std": 328.1475, "Agent": "SAC"}, {"env_step": 690000, "rew": 4749.7072, "rew_std": 259.9067, "Agent": "SAC"}, {"env_step": 695000, "rew": 4800.2761, "rew_std": 266.7347, "Agent": "SAC"}, {"env_step": 700000, "rew": 4792.0478, "rew_std": 325.5644, "Agent": "SAC"}, {"env_step": 705000, "rew": 4781.8091, "rew_std": 319.7762, "Agent": "SAC"}, {"env_step": 710000, "rew": 4755.8539, "rew_std": 301.7209, "Agent": "SAC"}, {"env_step": 715000, "rew": 4801.6133, "rew_std": 313.9985, "Agent": "SAC"}, {"env_step": 720000, "rew": 4813.7196, "rew_std": 297.5344, "Agent": "SAC"}, {"env_step": 725000, "rew": 4342.3206, "rew_std": 1459.6998, "Agent": "SAC"}, {"env_step": 730000, "rew": 4871.0308, "rew_std": 294.6682, "Agent": "SAC"}, {"env_step": 735000, "rew": 4804.8159, "rew_std": 229.0327, "Agent": "SAC"}, {"env_step": 740000, "rew": 4774.688, "rew_std": 471.3831, "Agent": "SAC"}, {"env_step": 745000, "rew": 4776.7827, "rew_std": 276.7201, "Agent": "SAC"}, {"env_step": 750000, "rew": 4874.8524, "rew_std": 272.0392, "Agent": "SAC"}, {"env_step": 755000, "rew": 4828.406, "rew_std": 272.7295, "Agent": "SAC"}, {"env_step": 760000, "rew": 4839.0527, "rew_std": 321.5127, "Agent": "SAC"}, {"env_step": 765000, "rew": 4813.0792, "rew_std": 246.6873, "Agent": "SAC"}, {"env_step": 770000, "rew": 4793.6444, "rew_std": 236.0907, "Agent": "SAC"}, {"env_step": 775000, "rew": 4351.0101, "rew_std": 1468.2281, "Agent": "SAC"}, {"env_step": 780000, "rew": 4871.9559, "rew_std": 274.0046, "Agent": "SAC"}, {"env_step": 785000, "rew": 4870.5481, "rew_std": 302.3448, "Agent": "SAC"}, {"env_step": 790000, "rew": 4810.3993, "rew_std": 290.871, "Agent": "SAC"}, {"env_step": 795000, "rew": 4869.6752, "rew_std": 320.4274, "Agent": "SAC"}, {"env_step": 800000, "rew": 4929.2482, "rew_std": 281.3255, "Agent": "SAC"}, {"env_step": 805000, "rew": 4904.1074, "rew_std": 319.2952, "Agent": "SAC"}, {"env_step": 810000, "rew": 4828.2516, "rew_std": 248.9182, "Agent": "SAC"}, {"env_step": 815000, "rew": 4868.561, "rew_std": 353.0873, "Agent": "SAC"}, {"env_step": 820000, "rew": 4852.1619, "rew_std": 316.7407, "Agent": "SAC"}, {"env_step": 825000, "rew": 4888.9612, "rew_std": 304.478, "Agent": "SAC"}, {"env_step": 830000, "rew": 4879.1963, "rew_std": 323.2041, "Agent": "SAC"}, {"env_step": 835000, "rew": 4932.074, "rew_std": 269.818, "Agent": "SAC"}, {"env_step": 840000, "rew": 4865.5276, "rew_std": 266.335, "Agent": "SAC"}, {"env_step": 845000, "rew": 4919.0112, "rew_std": 288.4665, "Agent": "SAC"}, {"env_step": 850000, "rew": 4863.3539, "rew_std": 308.8071, "Agent": "SAC"}, {"env_step": 855000, "rew": 4487.3525, "rew_std": 1507.675, "Agent": "SAC"}, {"env_step": 860000, "rew": 4595.9993, "rew_std": 1208.7824, "Agent": "SAC"}, {"env_step": 865000, "rew": 4586.4829, "rew_std": 1208.126, "Agent": "SAC"}, {"env_step": 870000, "rew": 4624.6886, "rew_std": 1072.1255, "Agent": "SAC"}, {"env_step": 875000, "rew": 4927.1432, "rew_std": 333.9255, "Agent": "SAC"}, {"env_step": 880000, "rew": 4713.0344, "rew_std": 505.1897, "Agent": "SAC"}, {"env_step": 885000, "rew": 4863.7618, "rew_std": 289.8723, "Agent": "SAC"}, {"env_step": 890000, "rew": 4906.5223, "rew_std": 309.4497, "Agent": "SAC"}, {"env_step": 895000, "rew": 4903.552, "rew_std": 334.2238, "Agent": "SAC"}, {"env_step": 900000, "rew": 4975.752, "rew_std": 204.8283, "Agent": "SAC"}, {"env_step": 905000, "rew": 4939.0452, "rew_std": 294.1009, "Agent": "SAC"}, {"env_step": 910000, "rew": 4932.2537, "rew_std": 266.7105, "Agent": "SAC"}, {"env_step": 915000, "rew": 4923.4304, "rew_std": 286.5257, "Agent": "SAC"}, {"env_step": 920000, "rew": 4925.4901, "rew_std": 321.2685, "Agent": "SAC"}, {"env_step": 925000, "rew": 4930.469, "rew_std": 258.552, "Agent": "SAC"}, {"env_step": 930000, "rew": 4956.2111, "rew_std": 247.6533, "Agent": "SAC"}, {"env_step": 935000, "rew": 4976.9714, "rew_std": 262.3986, "Agent": "SAC"}, {"env_step": 940000, "rew": 4939.6174, "rew_std": 303.659, "Agent": "SAC"}, {"env_step": 945000, "rew": 4902.8756, "rew_std": 302.1218, "Agent": "SAC"}, {"env_step": 950000, "rew": 4922.0174, "rew_std": 275.016, "Agent": "SAC"}, {"env_step": 955000, "rew": 4709.7878, "rew_std": 763.3719, "Agent": "SAC"}, {"env_step": 960000, "rew": 4433.3008, "rew_std": 1511.4133, "Agent": "SAC"}, {"env_step": 965000, "rew": 4950.9803, "rew_std": 334.9916, "Agent": "SAC"}, {"env_step": 970000, "rew": 4717.4681, "rew_std": 735.1069, "Agent": "SAC"}, {"env_step": 975000, "rew": 4871.5042, "rew_std": 302.9081, "Agent": "SAC"}, {"env_step": 980000, "rew": 4969.5632, "rew_std": 283.0509, "Agent": "SAC"}, {"env_step": 985000, "rew": 4919.6581, "rew_std": 299.977, "Agent": "SAC"}, {"env_step": 990000, "rew": 4908.7273, "rew_std": 277.1986, "Agent": "SAC"}, {"env_step": 995000, "rew": 5006.9909, "rew_std": 251.5363, "Agent": "SAC"}, {"env_step": 1000000, "rew": 4960.8519, "rew_std": 326.6731, "Agent": "SAC"}, {"env_step": 1005000, "rew": 5007.6406, "rew_std": 276.5167, "Agent": "SAC"}, {"env_step": 1010000, "rew": 4975.1938, "rew_std": 251.1375, "Agent": "SAC"}, {"env_step": 1015000, "rew": 4644.0452, "rew_std": 1054.6104, "Agent": "SAC"}, {"env_step": 1020000, "rew": 5055.6218, "rew_std": 239.9198, "Agent": "SAC"}, {"env_step": 1025000, "rew": 5011.8421, "rew_std": 264.9829, "Agent": "SAC"}, {"env_step": 1030000, "rew": 4997.3616, "rew_std": 280.4018, "Agent": "SAC"}, {"env_step": 1035000, "rew": 4966.7413, "rew_std": 272.2318, "Agent": "SAC"}, {"env_step": 1040000, "rew": 4982.7577, "rew_std": 273.0634, "Agent": "SAC"}, {"env_step": 1045000, "rew": 5036.827, "rew_std": 234.8077, "Agent": "SAC"}, {"env_step": 1050000, "rew": 5064.187, "rew_std": 270.0732, "Agent": "SAC"}, {"env_step": 1055000, "rew": 5039.7243, "rew_std": 234.6565, "Agent": "SAC"}, {"env_step": 1060000, "rew": 5048.1365, "rew_std": 267.1999, "Agent": "SAC"}, {"env_step": 1065000, "rew": 5048.2367, "rew_std": 241.2245, "Agent": "SAC"}, {"env_step": 1070000, "rew": 5020.6526, "rew_std": 246.4498, "Agent": "SAC"}, {"env_step": 1075000, "rew": 5028.6578, "rew_std": 276.1192, "Agent": "SAC"}, {"env_step": 1080000, "rew": 5055.9845, "rew_std": 285.7831, "Agent": "SAC"}, {"env_step": 1085000, "rew": 5032.9481, "rew_std": 287.6907, "Agent": "SAC"}, {"env_step": 1090000, "rew": 5094.031, "rew_std": 235.2431, "Agent": "SAC"}, {"env_step": 1095000, "rew": 5034.7263, "rew_std": 287.0603, "Agent": "SAC"}, {"env_step": 1100000, "rew": 5088.3686, "rew_std": 269.512, "Agent": "SAC"}, {"env_step": 1105000, "rew": 5070.0633, "rew_std": 300.3387, "Agent": "SAC"}, {"env_step": 1110000, "rew": 5089.1961, "rew_std": 189.3168, "Agent": "SAC"}, {"env_step": 1115000, "rew": 5099.9245, "rew_std": 250.309, "Agent": "SAC"}, {"env_step": 1120000, "rew": 5089.3528, "rew_std": 220.9666, "Agent": "SAC"}, {"env_step": 1125000, "rew": 5070.1846, "rew_std": 226.8031, "Agent": "SAC"}, {"env_step": 1130000, "rew": 5107.3689, "rew_std": 237.5596, "Agent": "SAC"}, {"env_step": 1135000, "rew": 5061.5314, "rew_std": 226.2364, "Agent": "SAC"}, {"env_step": 1140000, "rew": 5079.4029, "rew_std": 264.8791, "Agent": "SAC"}, {"env_step": 1145000, "rew": 5058.1592, "rew_std": 264.707, "Agent": "SAC"}, {"env_step": 1150000, "rew": 4580.0414, "rew_std": 1525.9135, "Agent": "SAC"}, {"env_step": 1155000, "rew": 5124.2839, "rew_std": 237.1135, "Agent": "SAC"}, {"env_step": 1160000, "rew": 4789.3126, "rew_std": 964.1734, "Agent": "SAC"}, {"env_step": 1165000, "rew": 5098.6035, "rew_std": 246.2682, "Agent": "SAC"}, {"env_step": 1170000, "rew": 4985.6138, "rew_std": 263.8668, "Agent": "SAC"}, {"env_step": 1175000, "rew": 4649.6205, "rew_std": 1425.5773, "Agent": "SAC"}, {"env_step": 1180000, "rew": 4694.9734, "rew_std": 1563.7542, "Agent": "SAC"}, {"env_step": 1185000, "rew": 4744.1841, "rew_std": 1237.5092, "Agent": "SAC"}, {"env_step": 1190000, "rew": 5118.0235, "rew_std": 295.8218, "Agent": "SAC"}, {"env_step": 1195000, "rew": 5149.0656, "rew_std": 294.5632, "Agent": "SAC"}, {"env_step": 1200000, "rew": 5146.3338, "rew_std": 256.8307, "Agent": "SAC"}, {"env_step": 1205000, "rew": 5162.8329, "rew_std": 275.7237, "Agent": "SAC"}, {"env_step": 1210000, "rew": 5160.506, "rew_std": 231.5942, "Agent": "SAC"}, {"env_step": 1215000, "rew": 5146.5724, "rew_std": 247.9617, "Agent": "SAC"}, {"env_step": 1220000, "rew": 4940.8572, "rew_std": 608.9754, "Agent": "SAC"}, {"env_step": 1225000, "rew": 5140.356, "rew_std": 255.4533, "Agent": "SAC"}, {"env_step": 1230000, "rew": 5117.0055, "rew_std": 278.9903, "Agent": "SAC"}, {"env_step": 1235000, "rew": 5098.2526, "rew_std": 242.4591, "Agent": "SAC"}, {"env_step": 1240000, "rew": 5123.496, "rew_std": 267.9716, "Agent": "SAC"}, {"env_step": 1245000, "rew": 5111.109, "rew_std": 260.9796, "Agent": "SAC"}, {"env_step": 1250000, "rew": 4649.8175, "rew_std": 1331.5951, "Agent": "SAC"}, {"env_step": 0, "rew": 2.8782, "rew_std": 2.4482, "Agent": "TRPO"}, {"env_step": 30720, "rew": 276.4455, "rew_std": 43.0813, "Agent": "TRPO"}, {"env_step": 61440, "rew": 335.1316, "rew_std": 48.2392, "Agent": "TRPO"}, {"env_step": 92160, "rew": 391.3235, "rew_std": 36.9341, "Agent": "TRPO"}, {"env_step": 122880, "rew": 466.3054, "rew_std": 40.8731, "Agent": "TRPO"}, {"env_step": 153600, "rew": 560.3762, "rew_std": 123.1622, "Agent": "TRPO"}, {"env_step": 184320, "rew": 816.1841, "rew_std": 338.8366, "Agent": "TRPO"}, {"env_step": 215040, "rew": 941.1309, "rew_std": 290.7862, "Agent": "TRPO"}, {"env_step": 245760, "rew": 1330.0169, "rew_std": 601.3669, "Agent": "TRPO"}, {"env_step": 276480, "rew": 1507.2928, "rew_std": 654.0613, "Agent": "TRPO"}, {"env_step": 307200, "rew": 1695.9278, "rew_std": 635.0205, "Agent": "TRPO"}, {"env_step": 337920, "rew": 2023.8279, "rew_std": 785.6886, "Agent": "TRPO"}, {"env_step": 368640, "rew": 1956.3254, "rew_std": 806.3374, "Agent": "TRPO"}, {"env_step": 399360, "rew": 2064.5065, "rew_std": 729.1481, "Agent": "TRPO"}, {"env_step": 430080, "rew": 2258.863, "rew_std": 667.9189, "Agent": "TRPO"}, {"env_step": 460800, "rew": 2414.6735, "rew_std": 729.8499, "Agent": "TRPO"}, {"env_step": 491520, "rew": 2636.5873, "rew_std": 565.8571, "Agent": "TRPO"}, {"env_step": 522240, "rew": 2532.6049, "rew_std": 594.3816, "Agent": "TRPO"}, {"env_step": 552960, "rew": 2791.5012, "rew_std": 894.7685, "Agent": "TRPO"}, {"env_step": 583680, "rew": 2593.9214, "rew_std": 756.9525, "Agent": "TRPO"}, {"env_step": 614400, "rew": 3148.2629, "rew_std": 674.2353, "Agent": "TRPO"}, {"env_step": 645120, "rew": 2939.1722, "rew_std": 845.3298, "Agent": "TRPO"}, {"env_step": 675840, "rew": 2891.8465, "rew_std": 757.1896, "Agent": "TRPO"}, {"env_step": 706560, "rew": 2972.7679, "rew_std": 944.8747, "Agent": "TRPO"}, {"env_step": 737280, "rew": 3176.5802, "rew_std": 895.4807, "Agent": "TRPO"}, {"env_step": 768000, "rew": 3306.0625, "rew_std": 877.0806, "Agent": "TRPO"}, {"env_step": 798720, "rew": 3242.2065, "rew_std": 849.3133, "Agent": "TRPO"}, {"env_step": 829440, "rew": 3711.0828, "rew_std": 707.2374, "Agent": "TRPO"}, {"env_step": 860160, "rew": 3383.707, "rew_std": 865.0469, "Agent": "TRPO"}, {"env_step": 890880, "rew": 3374.8203, "rew_std": 857.1058, "Agent": "TRPO"}, {"env_step": 921600, "rew": 3669.1124, "rew_std": 971.3578, "Agent": "TRPO"}, {"env_step": 952320, "rew": 3826.7182, "rew_std": 782.7454, "Agent": "TRPO"}, {"env_step": 983040, "rew": 3699.1509, "rew_std": 792.6609, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 3506.9049, "rew_std": 714.3078, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 3640.3614, "rew_std": 1164.7342, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 3788.5475, "rew_std": 860.641, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 3636.2749, "rew_std": 513.901, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 3553.8113, "rew_std": 786.3746, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 3793.7271, "rew_std": 821.249, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 3866.1476, "rew_std": 839.2067, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 3736.955, "rew_std": 779.3455, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 3967.8554, "rew_std": 837.4972, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 3734.0451, "rew_std": 942.7567, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 3568.7172, "rew_std": 921.325, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 3637.7948, "rew_std": 1086.471, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 3528.3975, "rew_std": 854.6158, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 3968.9392, "rew_std": 959.0679, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 3840.0466, "rew_std": 964.3409, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 4024.779, "rew_std": 1101.5301, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 3816.7166, "rew_std": 1011.2852, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 3898.2826, "rew_std": 983.4458, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 3656.6691, "rew_std": 951.2498, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 4090.7454, "rew_std": 803.5782, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 3745.8832, "rew_std": 1057.9439, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 3921.2684, "rew_std": 1052.1085, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 3878.2909, "rew_std": 1331.2655, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 4047.5337, "rew_std": 1075.5706, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 3730.8862, "rew_std": 1258.0235, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 3803.3556, "rew_std": 932.9923, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 3881.5427, "rew_std": 943.1027, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 3518.1911, "rew_std": 1234.3249, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 3745.7263, "rew_std": 600.776, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 4017.2684, "rew_std": 933.6147, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 3671.991, "rew_std": 1111.098, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 3889.9664, "rew_std": 851.4248, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 3885.9574, "rew_std": 856.4463, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 4183.8565, "rew_std": 904.3467, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 3999.7238, "rew_std": 906.2692, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 4090.8771, "rew_std": 689.8292, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 4109.0513, "rew_std": 804.9544, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 4155.6098, "rew_std": 1155.4661, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 4229.3409, "rew_std": 888.0334, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 4493.5781, "rew_std": 790.242, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 4034.784, "rew_std": 1025.8938, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 4221.0877, "rew_std": 806.7314, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 4104.1356, "rew_std": 1020.4961, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 4125.9129, "rew_std": 919.1601, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 4365.8701, "rew_std": 1141.2491, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 4391.7007, "rew_std": 898.0656, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 3881.6266, "rew_std": 1129.9531, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 4455.6202, "rew_std": 945.3446, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 4701.8233, "rew_std": 921.1578, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 4426.9202, "rew_std": 877.2145, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 4482.3431, "rew_std": 668.8882, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 4105.0671, "rew_std": 859.9176, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 4491.0214, "rew_std": 940.9178, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 4599.7047, "rew_std": 762.2523, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 4787.0578, "rew_std": 609.1534, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 4445.1027, "rew_std": 1037.8115, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 4241.8485, "rew_std": 877.5309, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 4370.9328, "rew_std": 1007.9423, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 4358.4113, "rew_std": 1043.4188, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 4640.1919, "rew_std": 713.5401, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 4361.7372, "rew_std": 883.1266, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 4613.8892, "rew_std": 928.3251, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 4750.1872, "rew_std": 915.7121, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 4680.6571, "rew_std": 520.604, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 4673.5736, "rew_std": 1017.1457, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 4545.0052, "rew_std": 1070.5663, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 4809.5956, "rew_std": 619.5596, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 4546.4164, "rew_std": 941.7217, "Agent": "TRPO"}, {"env_step": 0, "rew": 2.8782, "rew_std": 2.4482, "Agent": "A2C"}, {"env_step": 30000, "rew": 202.0535, "rew_std": 125.0532, "Agent": "A2C"}, {"env_step": 60000, "rew": 203.6009, "rew_std": 89.9611, "Agent": "A2C"}, {"env_step": 90000, "rew": 199.7673, "rew_std": 128.6289, "Agent": "A2C"}, {"env_step": 120000, "rew": 357.4458, "rew_std": 234.692, "Agent": "A2C"}, {"env_step": 150000, "rew": 478.5225, "rew_std": 222.9604, "Agent": "A2C"}, {"env_step": 180000, "rew": 548.6189, "rew_std": 294.5077, "Agent": "A2C"}, {"env_step": 210000, "rew": 645.4596, "rew_std": 310.3026, "Agent": "A2C"}, {"env_step": 240000, "rew": 628.3285, "rew_std": 199.1911, "Agent": "A2C"}, {"env_step": 270000, "rew": 671.2689, "rew_std": 335.6988, "Agent": "A2C"}, {"env_step": 300000, "rew": 547.9335, "rew_std": 236.2914, "Agent": "A2C"}, {"env_step": 330000, "rew": 507.6304, "rew_std": 160.0392, "Agent": "A2C"}, {"env_step": 360000, "rew": 570.0976, "rew_std": 255.8385, "Agent": "A2C"}, {"env_step": 390000, "rew": 556.3672, "rew_std": 204.2733, "Agent": "A2C"}, {"env_step": 420000, "rew": 561.311, "rew_std": 233.6207, "Agent": "A2C"}, {"env_step": 450000, "rew": 634.9585, "rew_std": 468.7015, "Agent": "A2C"}, {"env_step": 480000, "rew": 513.6519, "rew_std": 255.8916, "Agent": "A2C"}, {"env_step": 510000, "rew": 566.4153, "rew_std": 369.6174, "Agent": "A2C"}, {"env_step": 540000, "rew": 635.222, "rew_std": 356.6058, "Agent": "A2C"}, {"env_step": 570000, "rew": 664.1834, "rew_std": 377.3301, "Agent": "A2C"}, {"env_step": 600000, "rew": 782.6997, "rew_std": 539.4781, "Agent": "A2C"}, {"env_step": 630000, "rew": 719.1225, "rew_std": 355.298, "Agent": "A2C"}, {"env_step": 660000, "rew": 646.7552, "rew_std": 410.0789, "Agent": "A2C"}, {"env_step": 690000, "rew": 726.9089, "rew_std": 287.1523, "Agent": "A2C"}, {"env_step": 720000, "rew": 854.5273, "rew_std": 491.4004, "Agent": "A2C"}, {"env_step": 750000, "rew": 939.489, "rew_std": 746.9804, "Agent": "A2C"}, {"env_step": 780000, "rew": 993.2047, "rew_std": 737.1577, "Agent": "A2C"}, {"env_step": 810000, "rew": 983.7853, "rew_std": 534.7566, "Agent": "A2C"}, {"env_step": 840000, "rew": 828.3384, "rew_std": 438.1715, "Agent": "A2C"}, {"env_step": 870000, "rew": 1091.6377, "rew_std": 709.1839, "Agent": "A2C"}, {"env_step": 900000, "rew": 869.1863, "rew_std": 371.6148, "Agent": "A2C"}, {"env_step": 930000, "rew": 1028.6036, "rew_std": 618.1783, "Agent": "A2C"}, {"env_step": 960000, "rew": 1071.456, "rew_std": 608.5518, "Agent": "A2C"}, {"env_step": 990000, "rew": 1218.9367, "rew_std": 715.4378, "Agent": "A2C"}, {"env_step": 1020000, "rew": 1171.0587, "rew_std": 515.9813, "Agent": "A2C"}, {"env_step": 1050000, "rew": 1289.9904, "rew_std": 756.4703, "Agent": "A2C"}, {"env_step": 1080000, "rew": 1244.8827, "rew_std": 661.7623, "Agent": "A2C"}, {"env_step": 1110000, "rew": 1324.0092, "rew_std": 746.3179, "Agent": "A2C"}, {"env_step": 1140000, "rew": 1329.5089, "rew_std": 890.096, "Agent": "A2C"}, {"env_step": 1170000, "rew": 1440.4462, "rew_std": 868.7743, "Agent": "A2C"}, {"env_step": 1200000, "rew": 1452.9277, "rew_std": 881.4349, "Agent": "A2C"}, {"env_step": 1230000, "rew": 1641.462, "rew_std": 1019.5863, "Agent": "A2C"}, {"env_step": 1260000, "rew": 1672.4479, "rew_std": 984.9939, "Agent": "A2C"}, {"env_step": 1290000, "rew": 1608.7213, "rew_std": 864.3207, "Agent": "A2C"}, {"env_step": 1320000, "rew": 1617.7651, "rew_std": 1087.2479, "Agent": "A2C"}, {"env_step": 1350000, "rew": 1487.876, "rew_std": 988.1688, "Agent": "A2C"}, {"env_step": 1380000, "rew": 1476.9841, "rew_std": 768.3042, "Agent": "A2C"}, {"env_step": 1410000, "rew": 1805.3581, "rew_std": 1055.8783, "Agent": "A2C"}, {"env_step": 1440000, "rew": 1700.9757, "rew_std": 1165.7021, "Agent": "A2C"}, {"env_step": 1470000, "rew": 1771.6212, "rew_std": 901.2632, "Agent": "A2C"}, {"env_step": 1500000, "rew": 1766.9292, "rew_std": 967.6392, "Agent": "A2C"}, {"env_step": 1530000, "rew": 1574.3781, "rew_std": 961.4481, "Agent": "A2C"}, {"env_step": 1560000, "rew": 1788.8526, "rew_std": 792.947, "Agent": "A2C"}, {"env_step": 1590000, "rew": 1710.4779, "rew_std": 873.5761, "Agent": "A2C"}, {"env_step": 1620000, "rew": 1641.1858, "rew_std": 911.4718, "Agent": "A2C"}, {"env_step": 1650000, "rew": 1694.8277, "rew_std": 951.1382, "Agent": "A2C"}, {"env_step": 1680000, "rew": 1522.7366, "rew_std": 1068.8433, "Agent": "A2C"}, {"env_step": 1710000, "rew": 1394.1974, "rew_std": 715.0987, "Agent": "A2C"}, {"env_step": 1740000, "rew": 1350.849, "rew_std": 904.2712, "Agent": "A2C"}, {"env_step": 1770000, "rew": 1388.0303, "rew_std": 919.2345, "Agent": "A2C"}, {"env_step": 1800000, "rew": 1356.9308, "rew_std": 963.416, "Agent": "A2C"}, {"env_step": 1830000, "rew": 1316.883, "rew_std": 1070.2367, "Agent": "A2C"}, {"env_step": 1860000, "rew": 1272.1896, "rew_std": 924.1745, "Agent": "A2C"}, {"env_step": 1890000, "rew": 1386.0813, "rew_std": 1062.2458, "Agent": "A2C"}, {"env_step": 1920000, "rew": 1399.6613, "rew_std": 891.1578, "Agent": "A2C"}, {"env_step": 1950000, "rew": 1400.6987, "rew_std": 921.2195, "Agent": "A2C"}, {"env_step": 1980000, "rew": 1522.8818, "rew_std": 1060.9701, "Agent": "A2C"}, {"env_step": 2010000, "rew": 1395.3175, "rew_std": 1096.1453, "Agent": "A2C"}, {"env_step": 2040000, "rew": 1493.4073, "rew_std": 1334.7551, "Agent": "A2C"}, {"env_step": 2070000, "rew": 1475.0535, "rew_std": 1279.5097, "Agent": "A2C"}, {"env_step": 2100000, "rew": 1351.965, "rew_std": 1146.0997, "Agent": "A2C"}, {"env_step": 2130000, "rew": 1348.5182, "rew_std": 1050.743, "Agent": "A2C"}, {"env_step": 2160000, "rew": 1459.639, "rew_std": 1002.1804, "Agent": "A2C"}, {"env_step": 2190000, "rew": 1518.2845, "rew_std": 1217.019, "Agent": "A2C"}, {"env_step": 2220000, "rew": 1433.3372, "rew_std": 1185.8109, "Agent": "A2C"}, {"env_step": 2250000, "rew": 1504.5862, "rew_std": 1188.7119, "Agent": "A2C"}, {"env_step": 2280000, "rew": 1224.1892, "rew_std": 1016.6736, "Agent": "A2C"}, {"env_step": 2310000, "rew": 1372.7436, "rew_std": 1260.412, "Agent": "A2C"}, {"env_step": 2340000, "rew": 1396.0995, "rew_std": 1169.063, "Agent": "A2C"}, {"env_step": 2370000, "rew": 1319.1138, "rew_std": 1026.9624, "Agent": "A2C"}, {"env_step": 2400000, "rew": 1425.5124, "rew_std": 1166.84, "Agent": "A2C"}, {"env_step": 2430000, "rew": 1476.8554, "rew_std": 1220.7322, "Agent": "A2C"}, {"env_step": 2460000, "rew": 1365.7804, "rew_std": 1146.2047, "Agent": "A2C"}, {"env_step": 2490000, "rew": 1500.8564, "rew_std": 1190.1618, "Agent": "A2C"}, {"env_step": 2520000, "rew": 1516.4647, "rew_std": 1178.6812, "Agent": "A2C"}, {"env_step": 2550000, "rew": 1602.7566, "rew_std": 1381.7503, "Agent": "A2C"}, {"env_step": 2580000, "rew": 1364.5163, "rew_std": 1027.3753, "Agent": "A2C"}, {"env_step": 2610000, "rew": 1531.1848, "rew_std": 1143.1932, "Agent": "A2C"}, {"env_step": 2640000, "rew": 1437.8663, "rew_std": 1099.3151, "Agent": "A2C"}, {"env_step": 2670000, "rew": 1585.5412, "rew_std": 1187.9854, "Agent": "A2C"}, {"env_step": 2700000, "rew": 1463.7896, "rew_std": 939.225, "Agent": "A2C"}, {"env_step": 2730000, "rew": 1581.0281, "rew_std": 1204.4173, "Agent": "A2C"}, {"env_step": 2760000, "rew": 1582.5326, "rew_std": 1240.9568, "Agent": "A2C"}, {"env_step": 2790000, "rew": 1670.3598, "rew_std": 1185.5812, "Agent": "A2C"}, {"env_step": 2820000, "rew": 1517.0635, "rew_std": 1063.1808, "Agent": "A2C"}, {"env_step": 2850000, "rew": 1577.4279, "rew_std": 1179.4943, "Agent": "A2C"}, {"env_step": 2880000, "rew": 1549.6955, "rew_std": 1181.2401, "Agent": "A2C"}, {"env_step": 2910000, "rew": 1517.3998, "rew_std": 1060.0786, "Agent": "A2C"}, {"env_step": 2940000, "rew": 1465.4266, "rew_std": 1144.2754, "Agent": "A2C"}, {"env_step": 2970000, "rew": 1619.9052, "rew_std": 1184.9169, "Agent": "A2C"}, {"env_step": 3000000, "rew": 1658.422, "rew_std": 1153.6737, "Agent": "A2C"}, {"env_step": 0, "rew": 3.0706, "rew_std": 2.4242, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 297.0348, "rew_std": 89.1263, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 308.6476, "rew_std": 164.9206, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 302.9199, "rew_std": 156.569, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 290.7388, "rew_std": 125.0331, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 315.0668, "rew_std": 81.0874, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 360.8104, "rew_std": 145.8789, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 375.5536, "rew_std": 205.9347, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 414.0836, "rew_std": 216.7356, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 395.1604, "rew_std": 193.851, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 399.2448, "rew_std": 187.0716, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 414.4444, "rew_std": 225.0963, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 455.9466, "rew_std": 219.6832, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 383.156, "rew_std": 116.8607, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 449.4804, "rew_std": 228.6865, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 411.1399, "rew_std": 78.3228, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 413.2097, "rew_std": 78.9856, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 437.5513, "rew_std": 106.2422, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 411.0765, "rew_std": 82.1915, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 447.4096, "rew_std": 125.4615, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 470.9888, "rew_std": 204.8143, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 469.4696, "rew_std": 146.7702, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 416.0335, "rew_std": 120.4198, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 450.132, "rew_std": 116.2922, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 460.4646, "rew_std": 128.3028, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 410.7637, "rew_std": 99.9272, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 444.7342, "rew_std": 99.8818, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 497.7111, "rew_std": 125.2393, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 476.762, "rew_std": 124.4981, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 502.4518, "rew_std": 111.7917, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 561.7485, "rew_std": 198.9825, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 619.0941, "rew_std": 277.3773, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 537.1578, "rew_std": 225.4934, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 584.0505, "rew_std": 278.1569, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 706.8412, "rew_std": 335.0092, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 620.9084, "rew_std": 246.2422, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 576.2241, "rew_std": 235.9415, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 626.7084, "rew_std": 235.1919, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 679.0752, "rew_std": 360.0373, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 688.2521, "rew_std": 342.8477, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 706.9692, "rew_std": 399.908, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 653.5134, "rew_std": 375.8327, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 721.4667, "rew_std": 426.1078, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 637.5896, "rew_std": 240.0467, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 751.7907, "rew_std": 445.7886, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 656.1142, "rew_std": 219.4402, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 685.1033, "rew_std": 324.7073, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 699.3731, "rew_std": 286.4977, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 701.7371, "rew_std": 360.77, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 711.4184, "rew_std": 251.996, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 789.8676, "rew_std": 348.6923, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 749.1981, "rew_std": 271.5748, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 801.281, "rew_std": 327.2471, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 737.8412, "rew_std": 254.1714, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 713.9641, "rew_std": 236.4116, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 742.7832, "rew_std": 203.8988, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 813.1017, "rew_std": 253.3622, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 790.645, "rew_std": 230.9439, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 717.8086, "rew_std": 173.6694, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 852.3277, "rew_std": 283.3972, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 929.943, "rew_std": 414.0796, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 924.3004, "rew_std": 373.9222, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 783.2235, "rew_std": 201.4583, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 975.48, "rew_std": 466.0772, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 989.3575, "rew_std": 423.3858, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 953.8659, "rew_std": 460.4283, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 879.6609, "rew_std": 395.0328, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 918.0207, "rew_std": 330.3395, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 878.8959, "rew_std": 342.9723, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 1034.2593, "rew_std": 488.9087, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 880.1474, "rew_std": 313.2929, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 969.4703, "rew_std": 319.9895, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 955.7337, "rew_std": 401.744, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 789.4459, "rew_std": 265.3747, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 932.7362, "rew_std": 444.3527, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 967.646, "rew_std": 325.098, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 1039.2046, "rew_std": 434.3245, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 879.698, "rew_std": 239.0196, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 1023.4071, "rew_std": 299.1967, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 992.6516, "rew_std": 353.9518, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 923.7997, "rew_std": 296.9229, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 1054.9251, "rew_std": 373.6577, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 1067.3841, "rew_std": 307.4446, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 1058.0064, "rew_std": 455.9785, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 1108.0236, "rew_std": 480.3206, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 1183.9306, "rew_std": 474.8471, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 1168.6298, "rew_std": 455.2282, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 1146.7878, "rew_std": 456.2708, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 1129.638, "rew_std": 336.7948, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 1213.7447, "rew_std": 696.0454, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 1259.4968, "rew_std": 636.493, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 1205.2767, "rew_std": 538.7521, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 1241.2245, "rew_std": 507.8919, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 999.9475, "rew_std": 388.0333, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 1095.1805, "rew_std": 386.0712, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 1258.7733, "rew_std": 627.9112, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 1065.5095, "rew_std": 328.7561, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 1100.6237, "rew_std": 447.4947, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 1329.1346, "rew_std": 498.8758, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 1049.2236, "rew_std": 324.0807, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 1254.8096, "rew_std": 647.9675, "Agent": "ACKTR"}, {"env_step": 0, "rew": 6.442, "rew_std": 12.7772, "Agent": "DDPG"}, {"env_step": 5000, "rew": 209.6345, "rew_std": 106.9195, "Agent": "DDPG"}, {"env_step": 10000, "rew": 92.4845, "rew_std": 86.3134, "Agent": "DDPG"}, {"env_step": 15000, "rew": 110.9192, "rew_std": 72.742, "Agent": "DDPG"}, {"env_step": 20000, "rew": 76.0794, "rew_std": 38.337, "Agent": "DDPG"}, {"env_step": 25000, "rew": 75.6129, "rew_std": 47.0657, "Agent": "DDPG"}, {"env_step": 30000, "rew": 52.394, "rew_std": 41.8502, "Agent": "DDPG"}, {"env_step": 35000, "rew": 72.7174, "rew_std": 59.2642, "Agent": "DDPG"}, {"env_step": 40000, "rew": 76.7715, "rew_std": 37.4037, "Agent": "DDPG"}, {"env_step": 45000, "rew": 86.3831, "rew_std": 52.4139, "Agent": "DDPG"}, {"env_step": 50000, "rew": 72.4621, "rew_std": 67.6108, "Agent": "DDPG"}, {"env_step": 55000, "rew": 113.8373, "rew_std": 73.6839, "Agent": "DDPG"}, {"env_step": 60000, "rew": 109.5331, "rew_std": 53.8501, "Agent": "DDPG"}, {"env_step": 65000, "rew": 112.6556, "rew_std": 107.7279, "Agent": "DDPG"}, {"env_step": 70000, "rew": 98.8362, "rew_std": 77.1782, "Agent": "DDPG"}, {"env_step": 75000, "rew": 85.5219, "rew_std": 96.1378, "Agent": "DDPG"}, {"env_step": 80000, "rew": 76.2617, "rew_std": 76.3135, "Agent": "DDPG"}, {"env_step": 85000, "rew": 80.9462, "rew_std": 66.6375, "Agent": "DDPG"}, {"env_step": 90000, "rew": 154.9533, "rew_std": 81.1592, "Agent": "DDPG"}, {"env_step": 95000, "rew": 82.6995, "rew_std": 63.5277, "Agent": "DDPG"}, {"env_step": 100000, "rew": 112.936, "rew_std": 77.8394, "Agent": "DDPG"}, {"env_step": 105000, "rew": 78.5565, "rew_std": 60.9083, "Agent": "DDPG"}, {"env_step": 110000, "rew": 117.2462, "rew_std": 132.1358, "Agent": "DDPG"}, {"env_step": 115000, "rew": 124.6421, "rew_std": 51.137, "Agent": "DDPG"}, {"env_step": 120000, "rew": 124.3216, "rew_std": 54.4929, "Agent": "DDPG"}, {"env_step": 125000, "rew": 154.0886, "rew_std": 85.1201, "Agent": "DDPG"}, {"env_step": 130000, "rew": 104.8898, "rew_std": 57.6905, "Agent": "DDPG"}, {"env_step": 135000, "rew": 137.9333, "rew_std": 102.3852, "Agent": "DDPG"}, {"env_step": 140000, "rew": 104.9934, "rew_std": 183.7926, "Agent": "DDPG"}, {"env_step": 145000, "rew": 100.7575, "rew_std": 171.5016, "Agent": "DDPG"}, {"env_step": 150000, "rew": 90.4641, "rew_std": 68.0479, "Agent": "DDPG"}, {"env_step": 155000, "rew": 84.1395, "rew_std": 77.7355, "Agent": "DDPG"}, {"env_step": 160000, "rew": 177.786, "rew_std": 172.6902, "Agent": "DDPG"}, {"env_step": 165000, "rew": 122.3961, "rew_std": 66.4944, "Agent": "DDPG"}, {"env_step": 170000, "rew": 131.1034, "rew_std": 77.2705, "Agent": "DDPG"}, {"env_step": 175000, "rew": 111.1769, "rew_std": 84.1658, "Agent": "DDPG"}, {"env_step": 180000, "rew": 128.7461, "rew_std": 73.745, "Agent": "DDPG"}, {"env_step": 185000, "rew": 139.9738, "rew_std": 91.6826, "Agent": "DDPG"}, {"env_step": 190000, "rew": 127.8014, "rew_std": 46.3038, "Agent": "DDPG"}, {"env_step": 195000, "rew": 102.6062, "rew_std": 92.6227, "Agent": "DDPG"}, {"env_step": 200000, "rew": 132.3893, "rew_std": 100.3886, "Agent": "DDPG"}, {"env_step": 205000, "rew": 120.6603, "rew_std": 123.4709, "Agent": "DDPG"}, {"env_step": 210000, "rew": 142.4264, "rew_std": 75.8023, "Agent": "DDPG"}, {"env_step": 215000, "rew": 94.8948, "rew_std": 60.3429, "Agent": "DDPG"}, {"env_step": 220000, "rew": 190.8407, "rew_std": 105.0961, "Agent": "DDPG"}, {"env_step": 225000, "rew": 130.2816, "rew_std": 94.5308, "Agent": "DDPG"}, {"env_step": 230000, "rew": 134.1195, "rew_std": 63.554, "Agent": "DDPG"}, {"env_step": 235000, "rew": 115.2859, "rew_std": 84.2026, "Agent": "DDPG"}, {"env_step": 240000, "rew": 169.5648, "rew_std": 119.7629, "Agent": "DDPG"}, {"env_step": 245000, "rew": 137.7573, "rew_std": 80.8006, "Agent": "DDPG"}, {"env_step": 250000, "rew": 136.8237, "rew_std": 88.4955, "Agent": "DDPG"}, {"env_step": 255000, "rew": 175.491, "rew_std": 95.7576, "Agent": "DDPG"}, {"env_step": 260000, "rew": 70.75, "rew_std": 67.4469, "Agent": "DDPG"}, {"env_step": 265000, "rew": 192.4634, "rew_std": 89.4985, "Agent": "DDPG"}, {"env_step": 270000, "rew": 168.0737, "rew_std": 140.0323, "Agent": "DDPG"}, {"env_step": 275000, "rew": 239.2678, "rew_std": 191.3136, "Agent": "DDPG"}, {"env_step": 280000, "rew": 276.5269, "rew_std": 197.5713, "Agent": "DDPG"}, {"env_step": 285000, "rew": 198.5067, "rew_std": 115.4132, "Agent": "DDPG"}, {"env_step": 290000, "rew": 218.5237, "rew_std": 161.1736, "Agent": "DDPG"}, {"env_step": 295000, "rew": 107.6979, "rew_std": 76.2297, "Agent": "DDPG"}, {"env_step": 300000, "rew": 175.0175, "rew_std": 117.8822, "Agent": "DDPG"}, {"env_step": 305000, "rew": 182.3931, "rew_std": 106.9644, "Agent": "DDPG"}, {"env_step": 310000, "rew": 149.532, "rew_std": 81.8634, "Agent": "DDPG"}, {"env_step": 315000, "rew": 245.8521, "rew_std": 148.3624, "Agent": "DDPG"}, {"env_step": 320000, "rew": 222.2484, "rew_std": 208.8133, "Agent": "DDPG"}, {"env_step": 325000, "rew": 272.465, "rew_std": 236.4393, "Agent": "DDPG"}, {"env_step": 330000, "rew": 244.9023, "rew_std": 197.0817, "Agent": "DDPG"}, {"env_step": 335000, "rew": 299.4603, "rew_std": 127.8442, "Agent": "DDPG"}, {"env_step": 340000, "rew": 135.6976, "rew_std": 210.0048, "Agent": "DDPG"}, {"env_step": 345000, "rew": 206.761, "rew_std": 194.4503, "Agent": "DDPG"}, {"env_step": 350000, "rew": 188.1136, "rew_std": 175.2533, "Agent": "DDPG"}, {"env_step": 355000, "rew": 167.8189, "rew_std": 146.0266, "Agent": "DDPG"}, {"env_step": 360000, "rew": 274.149, "rew_std": 251.136, "Agent": "DDPG"}, {"env_step": 365000, "rew": 197.8242, "rew_std": 124.2311, "Agent": "DDPG"}, {"env_step": 370000, "rew": 322.0313, "rew_std": 276.4998, "Agent": "DDPG"}, {"env_step": 375000, "rew": 300.0051, "rew_std": 232.919, "Agent": "DDPG"}, {"env_step": 380000, "rew": 312.4954, "rew_std": 225.9516, "Agent": "DDPG"}, {"env_step": 385000, "rew": 339.0263, "rew_std": 289.9215, "Agent": "DDPG"}, {"env_step": 390000, "rew": 271.5934, "rew_std": 331.1485, "Agent": "DDPG"}, {"env_step": 395000, "rew": 273.9743, "rew_std": 217.7879, "Agent": "DDPG"}, {"env_step": 400000, "rew": 247.9654, "rew_std": 112.5402, "Agent": "DDPG"}, {"env_step": 405000, "rew": 307.8344, "rew_std": 290.5602, "Agent": "DDPG"}, {"env_step": 410000, "rew": 250.8802, "rew_std": 198.3437, "Agent": "DDPG"}, {"env_step": 415000, "rew": 264.7911, "rew_std": 257.0488, "Agent": "DDPG"}, {"env_step": 420000, "rew": 307.2985, "rew_std": 245.4246, "Agent": "DDPG"}, {"env_step": 425000, "rew": 491.5373, "rew_std": 320.2946, "Agent": "DDPG"}, {"env_step": 430000, "rew": 364.0395, "rew_std": 219.7442, "Agent": "DDPG"}, {"env_step": 435000, "rew": 280.9915, "rew_std": 170.8729, "Agent": "DDPG"}, {"env_step": 440000, "rew": 280.4218, "rew_std": 268.7534, "Agent": "DDPG"}, {"env_step": 445000, "rew": 137.9308, "rew_std": 100.7475, "Agent": "DDPG"}, {"env_step": 450000, "rew": 278.2392, "rew_std": 215.7367, "Agent": "DDPG"}, {"env_step": 455000, "rew": 203.5839, "rew_std": 217.6392, "Agent": "DDPG"}, {"env_step": 460000, "rew": 328.9681, "rew_std": 313.5935, "Agent": "DDPG"}, {"env_step": 465000, "rew": 328.8672, "rew_std": 287.9298, "Agent": "DDPG"}, {"env_step": 470000, "rew": 251.5499, "rew_std": 167.0568, "Agent": "DDPG"}, {"env_step": 475000, "rew": 341.3302, "rew_std": 296.015, "Agent": "DDPG"}, {"env_step": 480000, "rew": 370.4565, "rew_std": 291.124, "Agent": "DDPG"}, {"env_step": 485000, "rew": 393.9402, "rew_std": 285.233, "Agent": "DDPG"}, {"env_step": 490000, "rew": 328.3354, "rew_std": 206.531, "Agent": "DDPG"}, {"env_step": 495000, "rew": 229.3258, "rew_std": 120.8655, "Agent": "DDPG"}, {"env_step": 500000, "rew": 329.8083, "rew_std": 231.147, "Agent": "DDPG"}, {"env_step": 505000, "rew": 504.2143, "rew_std": 338.5162, "Agent": "DDPG"}, {"env_step": 510000, "rew": 435.8627, "rew_std": 347.7476, "Agent": "DDPG"}, {"env_step": 515000, "rew": 357.607, "rew_std": 211.3767, "Agent": "DDPG"}, {"env_step": 520000, "rew": 352.5914, "rew_std": 221.5513, "Agent": "DDPG"}, {"env_step": 525000, "rew": 590.6616, "rew_std": 294.2043, "Agent": "DDPG"}, {"env_step": 530000, "rew": 440.5676, "rew_std": 276.736, "Agent": "DDPG"}, {"env_step": 535000, "rew": 457.0677, "rew_std": 313.7813, "Agent": "DDPG"}, {"env_step": 540000, "rew": 567.1471, "rew_std": 531.5638, "Agent": "DDPG"}, {"env_step": 545000, "rew": 519.2827, "rew_std": 597.3046, "Agent": "DDPG"}, {"env_step": 550000, "rew": 325.0792, "rew_std": 248.0299, "Agent": "DDPG"}, {"env_step": 555000, "rew": 495.9099, "rew_std": 367.6617, "Agent": "DDPG"}, {"env_step": 560000, "rew": 354.0319, "rew_std": 283.1013, "Agent": "DDPG"}, {"env_step": 565000, "rew": 451.488, "rew_std": 347.1324, "Agent": "DDPG"}, {"env_step": 570000, "rew": 422.2737, "rew_std": 275.5602, "Agent": "DDPG"}, {"env_step": 575000, "rew": 386.7718, "rew_std": 263.3219, "Agent": "DDPG"}, {"env_step": 580000, "rew": 538.5896, "rew_std": 285.8722, "Agent": "DDPG"}, {"env_step": 585000, "rew": 506.4352, "rew_std": 240.8315, "Agent": "DDPG"}, {"env_step": 590000, "rew": 456.9596, "rew_std": 304.9017, "Agent": "DDPG"}, {"env_step": 595000, "rew": 471.5949, "rew_std": 215.2671, "Agent": "DDPG"}, {"env_step": 600000, "rew": 539.6254, "rew_std": 298.8542, "Agent": "DDPG"}, {"env_step": 605000, "rew": 411.5241, "rew_std": 338.0484, "Agent": "DDPG"}, {"env_step": 610000, "rew": 447.4153, "rew_std": 227.0487, "Agent": "DDPG"}, {"env_step": 615000, "rew": 371.9614, "rew_std": 235.5178, "Agent": "DDPG"}, {"env_step": 620000, "rew": 389.4932, "rew_std": 329.9028, "Agent": "DDPG"}, {"env_step": 625000, "rew": 710.1275, "rew_std": 479.455, "Agent": "DDPG"}, {"env_step": 630000, "rew": 715.731, "rew_std": 370.1965, "Agent": "DDPG"}, {"env_step": 635000, "rew": 617.3054, "rew_std": 383.7749, "Agent": "DDPG"}, {"env_step": 640000, "rew": 612.6088, "rew_std": 464.348, "Agent": "DDPG"}, {"env_step": 645000, "rew": 552.6727, "rew_std": 398.5933, "Agent": "DDPG"}, {"env_step": 650000, "rew": 639.7049, "rew_std": 586.3823, "Agent": "DDPG"}, {"env_step": 655000, "rew": 605.128, "rew_std": 455.4957, "Agent": "DDPG"}, {"env_step": 660000, "rew": 585.7066, "rew_std": 371.6375, "Agent": "DDPG"}, {"env_step": 665000, "rew": 637.137, "rew_std": 506.6573, "Agent": "DDPG"}, {"env_step": 670000, "rew": 496.4376, "rew_std": 337.2977, "Agent": "DDPG"}, {"env_step": 675000, "rew": 750.3062, "rew_std": 679.6938, "Agent": "DDPG"}, {"env_step": 680000, "rew": 707.022, "rew_std": 408.6625, "Agent": "DDPG"}, {"env_step": 685000, "rew": 649.8468, "rew_std": 318.9338, "Agent": "DDPG"}, {"env_step": 690000, "rew": 675.1389, "rew_std": 360.0423, "Agent": "DDPG"}, {"env_step": 695000, "rew": 1035.521, "rew_std": 602.2645, "Agent": "DDPG"}, {"env_step": 700000, "rew": 621.3213, "rew_std": 397.6714, "Agent": "DDPG"}, {"env_step": 705000, "rew": 720.6641, "rew_std": 472.6936, "Agent": "DDPG"}, {"env_step": 710000, "rew": 928.2668, "rew_std": 491.9258, "Agent": "DDPG"}, {"env_step": 715000, "rew": 720.6522, "rew_std": 438.0118, "Agent": "DDPG"}, {"env_step": 720000, "rew": 1006.4925, "rew_std": 778.8225, "Agent": "DDPG"}, {"env_step": 725000, "rew": 775.1715, "rew_std": 499.7838, "Agent": "DDPG"}, {"env_step": 730000, "rew": 734.8001, "rew_std": 535.1972, "Agent": "DDPG"}, {"env_step": 735000, "rew": 755.3114, "rew_std": 749.0306, "Agent": "DDPG"}, {"env_step": 740000, "rew": 562.1704, "rew_std": 396.1291, "Agent": "DDPG"}, {"env_step": 745000, "rew": 552.7935, "rew_std": 202.8772, "Agent": "DDPG"}, {"env_step": 750000, "rew": 805.4595, "rew_std": 345.2212, "Agent": "DDPG"}, {"env_step": 755000, "rew": 695.7063, "rew_std": 417.3729, "Agent": "DDPG"}, {"env_step": 760000, "rew": 723.2767, "rew_std": 386.8996, "Agent": "DDPG"}, {"env_step": 765000, "rew": 849.0509, "rew_std": 304.5712, "Agent": "DDPG"}, {"env_step": 770000, "rew": 784.1156, "rew_std": 299.4126, "Agent": "DDPG"}, {"env_step": 775000, "rew": 921.9506, "rew_std": 463.5833, "Agent": "DDPG"}, {"env_step": 780000, "rew": 1058.706, "rew_std": 531.6714, "Agent": "DDPG"}, {"env_step": 785000, "rew": 1114.4326, "rew_std": 496.5961, "Agent": "DDPG"}, {"env_step": 790000, "rew": 1079.6687, "rew_std": 833.8941, "Agent": "DDPG"}, {"env_step": 795000, "rew": 638.847, "rew_std": 308.0488, "Agent": "DDPG"}, {"env_step": 800000, "rew": 757.8548, "rew_std": 352.2484, "Agent": "DDPG"}, {"env_step": 805000, "rew": 831.3697, "rew_std": 445.5783, "Agent": "DDPG"}, {"env_step": 810000, "rew": 858.7461, "rew_std": 319.6896, "Agent": "DDPG"}, {"env_step": 815000, "rew": 816.9652, "rew_std": 434.1336, "Agent": "DDPG"}, {"env_step": 820000, "rew": 886.6492, "rew_std": 631.2365, "Agent": "DDPG"}, {"env_step": 825000, "rew": 1049.6078, "rew_std": 652.9144, "Agent": "DDPG"}, {"env_step": 830000, "rew": 1031.1323, "rew_std": 776.5163, "Agent": "DDPG"}, {"env_step": 835000, "rew": 1095.1575, "rew_std": 512.6977, "Agent": "DDPG"}, {"env_step": 840000, "rew": 1219.7758, "rew_std": 664.5146, "Agent": "DDPG"}, {"env_step": 845000, "rew": 1011.1645, "rew_std": 535.7047, "Agent": "DDPG"}, {"env_step": 850000, "rew": 904.2512, "rew_std": 425.4184, "Agent": "DDPG"}, {"env_step": 855000, "rew": 940.3503, "rew_std": 287.5882, "Agent": "DDPG"}, {"env_step": 860000, "rew": 884.3952, "rew_std": 379.0463, "Agent": "DDPG"}, {"env_step": 865000, "rew": 817.2448, "rew_std": 341.9711, "Agent": "DDPG"}, {"env_step": 870000, "rew": 935.3364, "rew_std": 626.8482, "Agent": "DDPG"}, {"env_step": 875000, "rew": 861.8186, "rew_std": 404.6279, "Agent": "DDPG"}, {"env_step": 880000, "rew": 1105.0786, "rew_std": 457.7364, "Agent": "DDPG"}, {"env_step": 885000, "rew": 1006.9897, "rew_std": 642.6791, "Agent": "DDPG"}, {"env_step": 890000, "rew": 1145.9055, "rew_std": 788.6456, "Agent": "DDPG"}, {"env_step": 895000, "rew": 793.1493, "rew_std": 699.8714, "Agent": "DDPG"}, {"env_step": 900000, "rew": 893.9485, "rew_std": 360.6161, "Agent": "DDPG"}, {"env_step": 905000, "rew": 948.873, "rew_std": 512.409, "Agent": "DDPG"}, {"env_step": 910000, "rew": 1000.8644, "rew_std": 555.9317, "Agent": "DDPG"}, {"env_step": 915000, "rew": 1246.2144, "rew_std": 686.9246, "Agent": "DDPG"}, {"env_step": 920000, "rew": 922.9555, "rew_std": 639.8346, "Agent": "DDPG"}, {"env_step": 925000, "rew": 1034.1605, "rew_std": 590.7845, "Agent": "DDPG"}, {"env_step": 930000, "rew": 888.3659, "rew_std": 510.8527, "Agent": "DDPG"}, {"env_step": 935000, "rew": 947.3354, "rew_std": 451.528, "Agent": "DDPG"}, {"env_step": 940000, "rew": 964.2577, "rew_std": 676.8375, "Agent": "DDPG"}, {"env_step": 945000, "rew": 1074.9208, "rew_std": 786.5433, "Agent": "DDPG"}, {"env_step": 950000, "rew": 792.7072, "rew_std": 621.3961, "Agent": "DDPG"}, {"env_step": 955000, "rew": 1129.5728, "rew_std": 510.5583, "Agent": "DDPG"}, {"env_step": 960000, "rew": 1109.5555, "rew_std": 593.7077, "Agent": "DDPG"}, {"env_step": 965000, "rew": 1044.0145, "rew_std": 695.5334, "Agent": "DDPG"}, {"env_step": 970000, "rew": 1213.4942, "rew_std": 613.818, "Agent": "DDPG"}, {"env_step": 975000, "rew": 1400.6112, "rew_std": 904.9948, "Agent": "DDPG"}, {"env_step": 980000, "rew": 1307.934, "rew_std": 721.4078, "Agent": "DDPG"}, {"env_step": 985000, "rew": 1171.1626, "rew_std": 930.6772, "Agent": "DDPG"}, {"env_step": 990000, "rew": 1366.0952, "rew_std": 910.6052, "Agent": "DDPG"}, {"env_step": 995000, "rew": 1160.4298, "rew_std": 508.7525, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 915.7222, "rew_std": 534.5199, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 1266.544, "rew_std": 694.0691, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 952.1188, "rew_std": 474.778, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 1266.1654, "rew_std": 1003.0514, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 1223.4316, "rew_std": 494.6038, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 1151.0592, "rew_std": 740.6732, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 1203.8333, "rew_std": 652.7641, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 1392.2484, "rew_std": 711.8577, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 1020.7799, "rew_std": 486.5689, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 1367.0833, "rew_std": 705.3204, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 1069.1821, "rew_std": 405.9415, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 1211.1614, "rew_std": 565.3418, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 1477.6099, "rew_std": 990.3152, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 1213.522, "rew_std": 734.6501, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 1059.1154, "rew_std": 471.9167, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 1164.246, "rew_std": 547.1, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 1117.6033, "rew_std": 678.8722, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 967.3343, "rew_std": 451.0196, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 1170.0815, "rew_std": 716.037, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 1105.9619, "rew_std": 795.8141, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 1355.7224, "rew_std": 659.8579, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 1333.6021, "rew_std": 791.1507, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 1215.6688, "rew_std": 694.2394, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 1535.3212, "rew_std": 654.6559, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 1266.2611, "rew_std": 524.1622, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 1423.7348, "rew_std": 533.8083, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 1471.318, "rew_std": 822.0757, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 1524.7916, "rew_std": 446.62, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 1534.0366, "rew_std": 926.9304, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 1279.9772, "rew_std": 415.4775, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 1126.2236, "rew_std": 614.9367, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 1307.0345, "rew_std": 569.8288, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 1085.1028, "rew_std": 679.3547, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 1159.2904, "rew_std": 685.5038, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 1253.3681, "rew_std": 514.3574, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 1231.8572, "rew_std": 516.4037, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 1284.062, "rew_std": 710.3769, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 1684.7917, "rew_std": 781.7017, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 1162.9384, "rew_std": 393.7133, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 1348.3814, "rew_std": 461.711, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 1296.4064, "rew_std": 646.6632, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 1242.8858, "rew_std": 779.497, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 1698.99, "rew_std": 558.7736, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 1329.7003, "rew_std": 763.7896, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 1147.4303, "rew_std": 611.0743, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 1242.4779, "rew_std": 586.2073, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 1454.4249, "rew_std": 531.6401, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 1261.938, "rew_std": 555.3104, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 1164.7458, "rew_std": 489.9345, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 1441.9256, "rew_std": 566.5546, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 1464.3456, "rew_std": 784.2176, "Agent": "DDPG"}, {"env_step": 0, "rew": 2.8782, "rew_std": 2.4482, "Agent": "NPG"}, {"env_step": 30720, "rew": 112.6522, "rew_std": 23.8697, "Agent": "NPG"}, {"env_step": 61440, "rew": 287.399, "rew_std": 18.8537, "Agent": "NPG"}, {"env_step": 92160, "rew": 291.4988, "rew_std": 24.0332, "Agent": "NPG"}, {"env_step": 122880, "rew": 316.6308, "rew_std": 29.1213, "Agent": "NPG"}, {"env_step": 153600, "rew": 334.6154, "rew_std": 31.6255, "Agent": "NPG"}, {"env_step": 184320, "rew": 354.9364, "rew_std": 45.2634, "Agent": "NPG"}, {"env_step": 215040, "rew": 388.8686, "rew_std": 36.5586, "Agent": "NPG"}, {"env_step": 245760, "rew": 421.4853, "rew_std": 42.871, "Agent": "NPG"}, {"env_step": 276480, "rew": 463.0154, "rew_std": 46.6935, "Agent": "NPG"}, {"env_step": 307200, "rew": 507.1279, "rew_std": 59.6974, "Agent": "NPG"}, {"env_step": 337920, "rew": 569.2482, "rew_std": 68.0989, "Agent": "NPG"}, {"env_step": 368640, "rew": 621.7042, "rew_std": 110.052, "Agent": "NPG"}, {"env_step": 399360, "rew": 690.7203, "rew_std": 120.9019, "Agent": "NPG"}, {"env_step": 430080, "rew": 723.6404, "rew_std": 139.7524, "Agent": "NPG"}, {"env_step": 460800, "rew": 796.4174, "rew_std": 154.9348, "Agent": "NPG"}, {"env_step": 491520, "rew": 829.0645, "rew_std": 224.9852, "Agent": "NPG"}, {"env_step": 522240, "rew": 989.404, "rew_std": 318.0274, "Agent": "NPG"}, {"env_step": 552960, "rew": 1070.3641, "rew_std": 371.5852, "Agent": "NPG"}, {"env_step": 583680, "rew": 1175.6614, "rew_std": 488.6075, "Agent": "NPG"}, {"env_step": 614400, "rew": 1474.6281, "rew_std": 787.4962, "Agent": "NPG"}, {"env_step": 645120, "rew": 1357.9694, "rew_std": 523.9254, "Agent": "NPG"}, {"env_step": 675840, "rew": 1490.8213, "rew_std": 768.911, "Agent": "NPG"}, {"env_step": 706560, "rew": 1607.691, "rew_std": 666.2092, "Agent": "NPG"}, {"env_step": 737280, "rew": 1694.3592, "rew_std": 617.5648, "Agent": "NPG"}, {"env_step": 768000, "rew": 1900.2682, "rew_std": 774.7461, "Agent": "NPG"}, {"env_step": 798720, "rew": 2103.572, "rew_std": 892.1839, "Agent": "NPG"}, {"env_step": 829440, "rew": 2030.9049, "rew_std": 600.1798, "Agent": "NPG"}, {"env_step": 860160, "rew": 2112.5021, "rew_std": 784.0933, "Agent": "NPG"}, {"env_step": 890880, "rew": 2191.2694, "rew_std": 948.1336, "Agent": "NPG"}, {"env_step": 921600, "rew": 2038.4032, "rew_std": 754.2217, "Agent": "NPG"}, {"env_step": 952320, "rew": 2281.8811, "rew_std": 702.9688, "Agent": "NPG"}, {"env_step": 983040, "rew": 2503.2147, "rew_std": 963.3421, "Agent": "NPG"}, {"env_step": 1013760, "rew": 2424.5509, "rew_std": 708.3593, "Agent": "NPG"}, {"env_step": 1044480, "rew": 2519.7144, "rew_std": 671.9148, "Agent": "NPG"}, {"env_step": 1075200, "rew": 2703.4138, "rew_std": 847.6787, "Agent": "NPG"}, {"env_step": 1105920, "rew": 2847.0771, "rew_std": 1114.5343, "Agent": "NPG"}, {"env_step": 1136640, "rew": 2755.8514, "rew_std": 842.0802, "Agent": "NPG"}, {"env_step": 1167360, "rew": 2738.7251, "rew_std": 659.2855, "Agent": "NPG"}, {"env_step": 1198080, "rew": 2852.8859, "rew_std": 838.6826, "Agent": "NPG"}, {"env_step": 1228800, "rew": 2865.8297, "rew_std": 926.2666, "Agent": "NPG"}, {"env_step": 1259520, "rew": 2939.751, "rew_std": 716.7971, "Agent": "NPG"}, {"env_step": 1290240, "rew": 2806.4684, "rew_std": 746.0406, "Agent": "NPG"}, {"env_step": 1320960, "rew": 3019.8786, "rew_std": 733.2081, "Agent": "NPG"}, {"env_step": 1351680, "rew": 3264.082, "rew_std": 892.7078, "Agent": "NPG"}, {"env_step": 1382400, "rew": 3154.9876, "rew_std": 890.9255, "Agent": "NPG"}, {"env_step": 1413120, "rew": 3070.7847, "rew_std": 751.5189, "Agent": "NPG"}, {"env_step": 1443840, "rew": 3300.3823, "rew_std": 907.4424, "Agent": "NPG"}, {"env_step": 1474560, "rew": 3013.6278, "rew_std": 772.1038, "Agent": "NPG"}, {"env_step": 1505280, "rew": 3203.737, "rew_std": 918.8399, "Agent": "NPG"}, {"env_step": 1536000, "rew": 3435.0662, "rew_std": 926.1293, "Agent": "NPG"}, {"env_step": 1566720, "rew": 3650.606, "rew_std": 880.6538, "Agent": "NPG"}, {"env_step": 1597440, "rew": 3594.429, "rew_std": 868.5779, "Agent": "NPG"}, {"env_step": 1628160, "rew": 3561.5818, "rew_std": 881.7381, "Agent": "NPG"}, {"env_step": 1658880, "rew": 3423.9483, "rew_std": 621.0521, "Agent": "NPG"}, {"env_step": 1689600, "rew": 3657.2812, "rew_std": 983.4185, "Agent": "NPG"}, {"env_step": 1720320, "rew": 3100.4422, "rew_std": 826.8598, "Agent": "NPG"}, {"env_step": 1751040, "rew": 3661.7091, "rew_std": 959.6696, "Agent": "NPG"}, {"env_step": 1781760, "rew": 3673.1036, "rew_std": 1011.3161, "Agent": "NPG"}, {"env_step": 1812480, "rew": 3351.3371, "rew_std": 867.3419, "Agent": "NPG"}, {"env_step": 1843200, "rew": 3511.2881, "rew_std": 669.0114, "Agent": "NPG"}, {"env_step": 1873920, "rew": 3720.4224, "rew_std": 780.0568, "Agent": "NPG"}, {"env_step": 1904640, "rew": 3834.7133, "rew_std": 843.3155, "Agent": "NPG"}, {"env_step": 1935360, "rew": 3819.3163, "rew_std": 754.4939, "Agent": "NPG"}, {"env_step": 1966080, "rew": 3835.2695, "rew_std": 798.1231, "Agent": "NPG"}, {"env_step": 1996800, "rew": 3724.7058, "rew_std": 918.0848, "Agent": "NPG"}, {"env_step": 2027520, "rew": 3698.5876, "rew_std": 721.3852, "Agent": "NPG"}, {"env_step": 2058240, "rew": 4015.9083, "rew_std": 941.2723, "Agent": "NPG"}, {"env_step": 2088960, "rew": 3820.293, "rew_std": 1008.6731, "Agent": "NPG"}, {"env_step": 2119680, "rew": 3674.3533, "rew_std": 855.2969, "Agent": "NPG"}, {"env_step": 2150400, "rew": 3626.8252, "rew_std": 960.4881, "Agent": "NPG"}, {"env_step": 2181120, "rew": 3824.4691, "rew_std": 847.7884, "Agent": "NPG"}, {"env_step": 2211840, "rew": 3848.5224, "rew_std": 894.3708, "Agent": "NPG"}, {"env_step": 2242560, "rew": 3782.4851, "rew_std": 746.5715, "Agent": "NPG"}, {"env_step": 2273280, "rew": 3993.4058, "rew_std": 882.7231, "Agent": "NPG"}, {"env_step": 2304000, "rew": 4111.5323, "rew_std": 846.544, "Agent": "NPG"}, {"env_step": 2334720, "rew": 4087.1457, "rew_std": 1043.8247, "Agent": "NPG"}, {"env_step": 2365440, "rew": 3885.5116, "rew_std": 879.8541, "Agent": "NPG"}, {"env_step": 2396160, "rew": 3891.22, "rew_std": 953.9313, "Agent": "NPG"}, {"env_step": 2426880, "rew": 4011.158, "rew_std": 894.0843, "Agent": "NPG"}, {"env_step": 2457600, "rew": 3987.8754, "rew_std": 723.513, "Agent": "NPG"}, {"env_step": 2488320, "rew": 3988.9495, "rew_std": 820.6914, "Agent": "NPG"}, {"env_step": 2519040, "rew": 4073.6939, "rew_std": 930.3635, "Agent": "NPG"}, {"env_step": 2549760, "rew": 4094.205, "rew_std": 816.9038, "Agent": "NPG"}, {"env_step": 2580480, "rew": 4202.6132, "rew_std": 777.2975, "Agent": "NPG"}, {"env_step": 2611200, "rew": 4355.3191, "rew_std": 797.2507, "Agent": "NPG"}, {"env_step": 2641920, "rew": 4232.2864, "rew_std": 917.0152, "Agent": "NPG"}, {"env_step": 2672640, "rew": 4012.3518, "rew_std": 989.9207, "Agent": "NPG"}, {"env_step": 2703360, "rew": 4168.4174, "rew_std": 898.3971, "Agent": "NPG"}, {"env_step": 2734080, "rew": 3987.0889, "rew_std": 898.8436, "Agent": "NPG"}, {"env_step": 2764800, "rew": 4205.7175, "rew_std": 823.4693, "Agent": "NPG"}, {"env_step": 2795520, "rew": 4264.8484, "rew_std": 833.9701, "Agent": "NPG"}, {"env_step": 2826240, "rew": 4086.8036, "rew_std": 858.5224, "Agent": "NPG"}, {"env_step": 2856960, "rew": 3948.5052, "rew_std": 1190.5425, "Agent": "NPG"}, {"env_step": 2887680, "rew": 4459.5002, "rew_std": 803.5574, "Agent": "NPG"}, {"env_step": 2918400, "rew": 4222.2665, "rew_std": 848.0455, "Agent": "NPG"}, {"env_step": 2949120, "rew": 4028.5353, "rew_std": 968.9714, "Agent": "NPG"}, {"env_step": 2979840, "rew": 4246.034, "rew_std": 819.8512, "Agent": "NPG"}, {"env_step": 3010560, "rew": 4333.7754, "rew_std": 945.4779, "Agent": "NPG"}, {"env_step": 3041280, "rew": 4264.4591, "rew_std": 825.6799, "Agent": "NPG"}, {"env_step": 3072000, "rew": 4586.884, "rew_std": 905.0242, "Agent": "NPG"}]