[{"env_step": 0, "rew": 1.0903, "rew_std": 3.5978, "Agent": "PPO"}, {"env_step": 30720, "rew": 14.541, "rew_std": 5.4261, "Agent": "PPO"}, {"env_step": 61440, "rew": -17.2246, "rew_std": 3.7694, "Agent": "PPO"}, {"env_step": 92160, "rew": -11.2966, "rew_std": 8.1654, "Agent": "PPO"}, {"env_step": 122880, "rew": -10.0344, "rew_std": 10.6224, "Agent": "PPO"}, {"env_step": 153600, "rew": 3.5313, "rew_std": 14.4579, "Agent": "PPO"}, {"env_step": 184320, "rew": 3.9484, "rew_std": 15.9274, "Agent": "PPO"}, {"env_step": 215040, "rew": 12.3234, "rew_std": 13.8123, "Agent": "PPO"}, {"env_step": 245760, "rew": 10.885, "rew_std": 19.2383, "Agent": "PPO"}, {"env_step": 276480, "rew": 15.0975, "rew_std": 14.2842, "Agent": "PPO"}, {"env_step": 307200, "rew": 16.7842, "rew_std": 17.8373, "Agent": "PPO"}, {"env_step": 337920, "rew": 24.768, "rew_std": 20.6693, "Agent": "PPO"}, {"env_step": 368640, "rew": 28.4681, "rew_std": 16.759, "Agent": "PPO"}, {"env_step": 399360, "rew": 31.9449, "rew_std": 14.1058, "Agent": "PPO"}, {"env_step": 430080, "rew": 33.7103, "rew_std": 8.9838, "Agent": "PPO"}, {"env_step": 460800, "rew": 31.834, "rew_std": 14.3058, "Agent": "PPO"}, {"env_step": 491520, "rew": 28.5064, "rew_std": 20.959, "Agent": "PPO"}, {"env_step": 522240, "rew": 28.5923, "rew_std": 29.5259, "Agent": "PPO"}, {"env_step": 552960, "rew": 23.8657, "rew_std": 22.2134, "Agent": "PPO"}, {"env_step": 583680, "rew": 34.3898, "rew_std": 34.7257, "Agent": "PPO"}, {"env_step": 614400, "rew": 31.3354, "rew_std": 27.7352, "Agent": "PPO"}, {"env_step": 645120, "rew": 29.9966, "rew_std": 23.1932, "Agent": "PPO"}, {"env_step": 675840, "rew": 34.0979, "rew_std": 26.5224, "Agent": "PPO"}, {"env_step": 706560, "rew": 36.3625, "rew_std": 16.5982, "Agent": "PPO"}, {"env_step": 737280, "rew": 37.9557, "rew_std": 17.0515, "Agent": "PPO"}, {"env_step": 768000, "rew": 35.7174, "rew_std": 17.8115, "Agent": "PPO"}, {"env_step": 798720, "rew": 47.5277, "rew_std": 38.7629, "Agent": "PPO"}, {"env_step": 829440, "rew": 44.0949, "rew_std": 38.5072, "Agent": "PPO"}, {"env_step": 860160, "rew": 63.287, "rew_std": 93.1252, "Agent": "PPO"}, {"env_step": 890880, "rew": 62.5291, "rew_std": 96.7548, "Agent": "PPO"}, {"env_step": 921600, "rew": 61.587, "rew_std": 99.9543, "Agent": "PPO"}, {"env_step": 952320, "rew": 66.6847, "rew_std": 99.1066, "Agent": "PPO"}, {"env_step": 983040, "rew": 66.1222, "rew_std": 99.6237, "Agent": "PPO"}, {"env_step": 1013760, "rew": 64.5596, "rew_std": 96.657, "Agent": "PPO"}, {"env_step": 1044480, "rew": 63.9429, "rew_std": 100.59, "Agent": "PPO"}, {"env_step": 1075200, "rew": 67.3104, "rew_std": 99.7823, "Agent": "PPO"}, {"env_step": 1105920, "rew": 68.3072, "rew_std": 99.4767, "Agent": "PPO"}, {"env_step": 1136640, "rew": 69.532, "rew_std": 98.3712, "Agent": "PPO"}, {"env_step": 1167360, "rew": 71.7715, "rew_std": 98.3249, "Agent": "PPO"}, {"env_step": 1198080, "rew": 70.3806, "rew_std": 98.6928, "Agent": "PPO"}, {"env_step": 1228800, "rew": 70.3897, "rew_std": 98.3615, "Agent": "PPO"}, {"env_step": 1259520, "rew": 71.1511, "rew_std": 98.1166, "Agent": "PPO"}, {"env_step": 1290240, "rew": 72.489, "rew_std": 98.3858, "Agent": "PPO"}, {"env_step": 1320960, "rew": 71.0808, "rew_std": 98.8914, "Agent": "PPO"}, {"env_step": 1351680, "rew": 69.7793, "rew_std": 98.9076, "Agent": "PPO"}, {"env_step": 1382400, "rew": 72.0401, "rew_std": 98.174, "Agent": "PPO"}, {"env_step": 1413120, "rew": 72.0039, "rew_std": 98.6329, "Agent": "PPO"}, {"env_step": 1443840, "rew": 71.0677, "rew_std": 99.5856, "Agent": "PPO"}, {"env_step": 1474560, "rew": 73.6586, "rew_std": 97.4667, "Agent": "PPO"}, {"env_step": 1505280, "rew": 70.4729, "rew_std": 99.3265, "Agent": "PPO"}, {"env_step": 1536000, "rew": 72.6155, "rew_std": 98.2909, "Agent": "PPO"}, {"env_step": 1566720, "rew": 75.7714, "rew_std": 97.3342, "Agent": "PPO"}, {"env_step": 1597440, "rew": 73.6515, "rew_std": 97.8379, "Agent": "PPO"}, {"env_step": 1628160, "rew": 73.5543, "rew_std": 98.5735, "Agent": "PPO"}, {"env_step": 1658880, "rew": 70.3039, "rew_std": 98.8956, "Agent": "PPO"}, {"env_step": 1689600, "rew": 75.3847, "rew_std": 97.7091, "Agent": "PPO"}, {"env_step": 1720320, "rew": 70.2479, "rew_std": 99.3575, "Agent": "PPO"}, {"env_step": 1751040, "rew": 75.8085, "rew_std": 97.4939, "Agent": "PPO"}, {"env_step": 1781760, "rew": 78.0713, "rew_std": 96.2682, "Agent": "PPO"}, {"env_step": 1812480, "rew": 70.7668, "rew_std": 99.9198, "Agent": "PPO"}, {"env_step": 1843200, "rew": 74.9315, "rew_std": 98.0385, "Agent": "PPO"}, {"env_step": 1873920, "rew": 74.4566, "rew_std": 97.8105, "Agent": "PPO"}, {"env_step": 1904640, "rew": 72.7717, "rew_std": 99.2967, "Agent": "PPO"}, {"env_step": 1935360, "rew": 76.5677, "rew_std": 96.9867, "Agent": "PPO"}, {"env_step": 1966080, "rew": 78.3815, "rew_std": 96.275, "Agent": "PPO"}, {"env_step": 1996800, "rew": 72.2778, "rew_std": 98.9372, "Agent": "PPO"}, {"env_step": 2027520, "rew": 73.4618, "rew_std": 98.2254, "Agent": "PPO"}, {"env_step": 2058240, "rew": 73.0458, "rew_std": 98.8491, "Agent": "PPO"}, {"env_step": 2088960, "rew": 76.1767, "rew_std": 97.7641, "Agent": "PPO"}, {"env_step": 2119680, "rew": 78.726, "rew_std": 96.0722, "Agent": "PPO"}, {"env_step": 2150400, "rew": 76.7965, "rew_std": 97.3736, "Agent": "PPO"}, {"env_step": 2181120, "rew": 75.239, "rew_std": 98.4263, "Agent": "PPO"}, {"env_step": 2211840, "rew": 76.4495, "rew_std": 97.35, "Agent": "PPO"}, {"env_step": 2242560, "rew": 77.0431, "rew_std": 96.7973, "Agent": "PPO"}, {"env_step": 2273280, "rew": 76.0307, "rew_std": 97.4001, "Agent": "PPO"}, {"env_step": 2304000, "rew": 77.3101, "rew_std": 97.2428, "Agent": "PPO"}, {"env_step": 2334720, "rew": 77.2666, "rew_std": 97.1735, "Agent": "PPO"}, {"env_step": 2365440, "rew": 75.6714, "rew_std": 97.8766, "Agent": "PPO"}, {"env_step": 2396160, "rew": 74.9936, "rew_std": 97.9828, "Agent": "PPO"}, {"env_step": 2426880, "rew": 78.1617, "rew_std": 96.8809, "Agent": "PPO"}, {"env_step": 2457600, "rew": 76.8037, "rew_std": 97.0951, "Agent": "PPO"}, {"env_step": 2488320, "rew": 79.3963, "rew_std": 96.5996, "Agent": "PPO"}, {"env_step": 2519040, "rew": 73.241, "rew_std": 99.1238, "Agent": "PPO"}, {"env_step": 2549760, "rew": 77.9169, "rew_std": 97.3104, "Agent": "PPO"}, {"env_step": 2580480, "rew": 79.9991, "rew_std": 96.0853, "Agent": "PPO"}, {"env_step": 2611200, "rew": 79.6211, "rew_std": 96.5515, "Agent": "PPO"}, {"env_step": 2641920, "rew": 78.5614, "rew_std": 96.9572, "Agent": "PPO"}, {"env_step": 2672640, "rew": 76.6251, "rew_std": 97.7851, "Agent": "PPO"}, {"env_step": 2703360, "rew": 73.7308, "rew_std": 98.7249, "Agent": "PPO"}, {"env_step": 2734080, "rew": 78.168, "rew_std": 96.7511, "Agent": "PPO"}, {"env_step": 2764800, "rew": 78.9345, "rew_std": 96.4013, "Agent": "PPO"}, {"env_step": 2795520, "rew": 77.202, "rew_std": 97.8047, "Agent": "PPO"}, {"env_step": 2826240, "rew": 78.4772, "rew_std": 96.6058, "Agent": "PPO"}, {"env_step": 2856960, "rew": 74.9028, "rew_std": 98.5857, "Agent": "PPO"}, {"env_step": 2887680, "rew": 78.9153, "rew_std": 96.8546, "Agent": "PPO"}, {"env_step": 2918400, "rew": 80.0785, "rew_std": 96.3598, "Agent": "PPO"}, {"env_step": 2949120, "rew": 78.4847, "rew_std": 96.8831, "Agent": "PPO"}, {"env_step": 2979840, "rew": 81.3662, "rew_std": 96.0461, "Agent": "PPO"}, {"env_step": 3010560, "rew": 78.3437, "rew_std": 97.3812, "Agent": "PPO"}, {"env_step": 3041280, "rew": 79.2758, "rew_std": 96.4586, "Agent": "PPO"}, {"env_step": 3072000, "rew": 77.5265, "rew_std": 97.1351, "Agent": "PPO"}, {"env_step": 0, "rew": -7.7439, "rew_std": 16.8878, "Agent": "TD3"}, {"env_step": 5000, "rew": 24.6469, "rew_std": 4.5382, "Agent": "TD3"}, {"env_step": 10000, "rew": 25.0534, "rew_std": 10.6669, "Agent": "TD3"}, {"env_step": 15000, "rew": 29.6534, "rew_std": 11.6169, "Agent": "TD3"}, {"env_step": 20000, "rew": 38.585, "rew_std": 9.998, "Agent": "TD3"}, {"env_step": 25000, "rew": 44.6048, "rew_std": 11.0176, "Agent": "TD3"}, {"env_step": 30000, "rew": 26.28, "rew_std": 26.582, "Agent": "TD3"}, {"env_step": 35000, "rew": 34.9212, "rew_std": 8.0993, "Agent": "TD3"}, {"env_step": 40000, "rew": 33.5783, "rew_std": 11.7866, "Agent": "TD3"}, {"env_step": 45000, "rew": 33.854, "rew_std": 8.7302, "Agent": "TD3"}, {"env_step": 50000, "rew": 39.2372, "rew_std": 13.5948, "Agent": "TD3"}, {"env_step": 55000, "rew": 37.533, "rew_std": 6.0203, "Agent": "TD3"}, {"env_step": 60000, "rew": 36.653, "rew_std": 6.8221, "Agent": "TD3"}, {"env_step": 65000, "rew": 41.4642, "rew_std": 8.1535, "Agent": "TD3"}, {"env_step": 70000, "rew": 40.2504, "rew_std": 8.7733, "Agent": "TD3"}, {"env_step": 75000, "rew": 40.4649, "rew_std": 9.2816, "Agent": "TD3"}, {"env_step": 80000, "rew": 38.4952, "rew_std": 16.6833, "Agent": "TD3"}, {"env_step": 85000, "rew": 41.4131, "rew_std": 9.4847, "Agent": "TD3"}, {"env_step": 90000, "rew": 40.3345, "rew_std": 12.7181, "Agent": "TD3"}, {"env_step": 95000, "rew": 44.8763, "rew_std": 6.4609, "Agent": "TD3"}, {"env_step": 100000, "rew": 44.8324, "rew_std": 6.8199, "Agent": "TD3"}, {"env_step": 105000, "rew": 42.1155, "rew_std": 6.4451, "Agent": "TD3"}, {"env_step": 110000, "rew": 45.29, "rew_std": 3.558, "Agent": "TD3"}, {"env_step": 115000, "rew": 43.5655, "rew_std": 8.7519, "Agent": "TD3"}, {"env_step": 120000, "rew": 44.2056, "rew_std": 7.8904, "Agent": "TD3"}, {"env_step": 125000, "rew": 45.1126, "rew_std": 4.9606, "Agent": "TD3"}, {"env_step": 130000, "rew": 46.5372, "rew_std": 5.0502, "Agent": "TD3"}, {"env_step": 135000, "rew": 46.5835, "rew_std": 5.288, "Agent": "TD3"}, {"env_step": 140000, "rew": 48.8754, "rew_std": 4.7581, "Agent": "TD3"}, {"env_step": 145000, "rew": 46.3889, "rew_std": 3.3211, "Agent": "TD3"}, {"env_step": 150000, "rew": 45.6373, "rew_std": 3.9252, "Agent": "TD3"}, {"env_step": 155000, "rew": 46.1775, "rew_std": 3.5939, "Agent": "TD3"}, {"env_step": 160000, "rew": 47.9908, "rew_std": 4.1987, "Agent": "TD3"}, {"env_step": 165000, "rew": 49.3943, "rew_std": 5.5982, "Agent": "TD3"}, {"env_step": 170000, "rew": 48.5755, "rew_std": 4.1708, "Agent": "TD3"}, {"env_step": 175000, "rew": 48.1512, "rew_std": 4.4001, "Agent": "TD3"}, {"env_step": 180000, "rew": 48.9247, "rew_std": 3.3916, "Agent": "TD3"}, {"env_step": 185000, "rew": 49.942, "rew_std": 3.9773, "Agent": "TD3"}, {"env_step": 190000, "rew": 48.5643, "rew_std": 2.8522, "Agent": "TD3"}, {"env_step": 195000, "rew": 47.3657, "rew_std": 5.0301, "Agent": "TD3"}, {"env_step": 200000, "rew": 50.0434, "rew_std": 3.9202, "Agent": "TD3"}, {"env_step": 205000, "rew": 47.858, "rew_std": 3.4439, "Agent": "TD3"}, {"env_step": 210000, "rew": 50.2507, "rew_std": 4.5715, "Agent": "TD3"}, {"env_step": 215000, "rew": 51.8494, "rew_std": 7.9624, "Agent": "TD3"}, {"env_step": 220000, "rew": 49.5942, "rew_std": 6.0095, "Agent": "TD3"}, {"env_step": 225000, "rew": 49.2158, "rew_std": 4.0273, "Agent": "TD3"}, {"env_step": 230000, "rew": 50.2866, "rew_std": 7.6562, "Agent": "TD3"}, {"env_step": 235000, "rew": 51.362, "rew_std": 6.8194, "Agent": "TD3"}, {"env_step": 240000, "rew": 49.5634, "rew_std": 6.0966, "Agent": "TD3"}, {"env_step": 245000, "rew": 47.582, "rew_std": 11.166, "Agent": "TD3"}, {"env_step": 250000, "rew": 51.2911, "rew_std": 8.8841, "Agent": "TD3"}, {"env_step": 255000, "rew": 52.3947, "rew_std": 9.7762, "Agent": "TD3"}, {"env_step": 260000, "rew": 52.2859, "rew_std": 11.4657, "Agent": "TD3"}, {"env_step": 265000, "rew": 55.5904, "rew_std": 12.1624, "Agent": "TD3"}, {"env_step": 270000, "rew": 55.3218, "rew_std": 10.1369, "Agent": "TD3"}, {"env_step": 275000, "rew": 53.8998, "rew_std": 9.8109, "Agent": "TD3"}, {"env_step": 280000, "rew": 56.1154, "rew_std": 7.0174, "Agent": "TD3"}, {"env_step": 285000, "rew": 57.3024, "rew_std": 10.2827, "Agent": "TD3"}, {"env_step": 290000, "rew": 57.764, "rew_std": 11.1871, "Agent": "TD3"}, {"env_step": 295000, "rew": 59.0905, "rew_std": 17.8983, "Agent": "TD3"}, {"env_step": 300000, "rew": 59.292, "rew_std": 17.2291, "Agent": "TD3"}, {"env_step": 305000, "rew": 60.419, "rew_std": 17.6389, "Agent": "TD3"}, {"env_step": 310000, "rew": 61.5869, "rew_std": 20.8453, "Agent": "TD3"}, {"env_step": 315000, "rew": 58.665, "rew_std": 14.5205, "Agent": "TD3"}, {"env_step": 320000, "rew": 61.191, "rew_std": 17.4832, "Agent": "TD3"}, {"env_step": 325000, "rew": 62.7797, "rew_std": 18.1448, "Agent": "TD3"}, {"env_step": 330000, "rew": 62.6546, "rew_std": 19.4931, "Agent": "TD3"}, {"env_step": 335000, "rew": 65.461, "rew_std": 19.32, "Agent": "TD3"}, {"env_step": 340000, "rew": 65.9703, "rew_std": 22.4508, "Agent": "TD3"}, {"env_step": 345000, "rew": 64.5671, "rew_std": 21.895, "Agent": "TD3"}, {"env_step": 350000, "rew": 69.7419, "rew_std": 25.4201, "Agent": "TD3"}, {"env_step": 355000, "rew": 66.8439, "rew_std": 21.4126, "Agent": "TD3"}, {"env_step": 360000, "rew": 67.2735, "rew_std": 22.4134, "Agent": "TD3"}, {"env_step": 365000, "rew": 70.1827, "rew_std": 23.8667, "Agent": "TD3"}, {"env_step": 370000, "rew": 67.7494, "rew_std": 21.4642, "Agent": "TD3"}, {"env_step": 375000, "rew": 70.1232, "rew_std": 26.1163, "Agent": "TD3"}, {"env_step": 380000, "rew": 70.7586, "rew_std": 24.5781, "Agent": "TD3"}, {"env_step": 385000, "rew": 69.3465, "rew_std": 26.9114, "Agent": "TD3"}, {"env_step": 390000, "rew": 70.8394, "rew_std": 25.6505, "Agent": "TD3"}, {"env_step": 395000, "rew": 72.95, "rew_std": 28.7033, "Agent": "TD3"}, {"env_step": 400000, "rew": 74.0454, "rew_std": 30.5719, "Agent": "TD3"}, {"env_step": 405000, "rew": 72.0362, "rew_std": 29.6133, "Agent": "TD3"}, {"env_step": 410000, "rew": 70.9323, "rew_std": 26.7513, "Agent": "TD3"}, {"env_step": 415000, "rew": 73.8199, "rew_std": 30.3458, "Agent": "TD3"}, {"env_step": 420000, "rew": 72.9135, "rew_std": 31.2769, "Agent": "TD3"}, {"env_step": 425000, "rew": 70.1839, "rew_std": 24.8352, "Agent": "TD3"}, {"env_step": 430000, "rew": 72.7441, "rew_std": 25.5592, "Agent": "TD3"}, {"env_step": 435000, "rew": 77.4554, "rew_std": 29.2872, "Agent": "TD3"}, {"env_step": 440000, "rew": 77.9076, "rew_std": 30.3671, "Agent": "TD3"}, {"env_step": 445000, "rew": 77.3448, "rew_std": 31.0666, "Agent": "TD3"}, {"env_step": 450000, "rew": 76.5884, "rew_std": 31.2528, "Agent": "TD3"}, {"env_step": 455000, "rew": 78.3391, "rew_std": 33.6286, "Agent": "TD3"}, {"env_step": 460000, "rew": 77.0918, "rew_std": 33.4976, "Agent": "TD3"}, {"env_step": 465000, "rew": 76.8354, "rew_std": 32.2517, "Agent": "TD3"}, {"env_step": 470000, "rew": 76.2787, "rew_std": 30.1177, "Agent": "TD3"}, {"env_step": 475000, "rew": 78.2738, "rew_std": 32.6535, "Agent": "TD3"}, {"env_step": 480000, "rew": 76.5014, "rew_std": 28.3248, "Agent": "TD3"}, {"env_step": 485000, "rew": 76.188, "rew_std": 30.7491, "Agent": "TD3"}, {"env_step": 490000, "rew": 77.5848, "rew_std": 30.0843, "Agent": "TD3"}, {"env_step": 495000, "rew": 77.3351, "rew_std": 29.965, "Agent": "TD3"}, {"env_step": 500000, "rew": 79.3092, "rew_std": 30.0778, "Agent": "TD3"}, {"env_step": 505000, "rew": 74.8518, "rew_std": 30.9475, "Agent": "TD3"}, {"env_step": 510000, "rew": 80.657, "rew_std": 31.7103, "Agent": "TD3"}, {"env_step": 515000, "rew": 80.9163, "rew_std": 29.685, "Agent": "TD3"}, {"env_step": 520000, "rew": 80.2363, "rew_std": 29.1871, "Agent": "TD3"}, {"env_step": 525000, "rew": 83.3068, "rew_std": 29.8053, "Agent": "TD3"}, {"env_step": 530000, "rew": 80.923, "rew_std": 29.902, "Agent": "TD3"}, {"env_step": 535000, "rew": 82.1793, "rew_std": 31.9273, "Agent": "TD3"}, {"env_step": 540000, "rew": 81.4991, "rew_std": 31.5799, "Agent": "TD3"}, {"env_step": 545000, "rew": 79.6794, "rew_std": 30.9146, "Agent": "TD3"}, {"env_step": 550000, "rew": 81.2391, "rew_std": 29.9395, "Agent": "TD3"}, {"env_step": 555000, "rew": 81.0082, "rew_std": 30.8059, "Agent": "TD3"}, {"env_step": 560000, "rew": 82.1303, "rew_std": 31.0288, "Agent": "TD3"}, {"env_step": 565000, "rew": 82.3656, "rew_std": 32.1176, "Agent": "TD3"}, {"env_step": 570000, "rew": 81.7197, "rew_std": 32.3548, "Agent": "TD3"}, {"env_step": 575000, "rew": 80.6937, "rew_std": 30.7503, "Agent": "TD3"}, {"env_step": 580000, "rew": 84.4082, "rew_std": 30.6736, "Agent": "TD3"}, {"env_step": 585000, "rew": 82.4516, "rew_std": 30.6142, "Agent": "TD3"}, {"env_step": 590000, "rew": 86.4441, "rew_std": 30.2415, "Agent": "TD3"}, {"env_step": 595000, "rew": 81.5008, "rew_std": 29.9591, "Agent": "TD3"}, {"env_step": 600000, "rew": 84.318, "rew_std": 29.7351, "Agent": "TD3"}, {"env_step": 605000, "rew": 83.5531, "rew_std": 30.6785, "Agent": "TD3"}, {"env_step": 610000, "rew": 86.2638, "rew_std": 30.767, "Agent": "TD3"}, {"env_step": 615000, "rew": 87.2233, "rew_std": 30.9616, "Agent": "TD3"}, {"env_step": 620000, "rew": 85.1809, "rew_std": 31.0423, "Agent": "TD3"}, {"env_step": 625000, "rew": 88.4356, "rew_std": 31.6306, "Agent": "TD3"}, {"env_step": 630000, "rew": 82.1748, "rew_std": 32.4394, "Agent": "TD3"}, {"env_step": 635000, "rew": 87.2665, "rew_std": 32.4218, "Agent": "TD3"}, {"env_step": 640000, "rew": 85.785, "rew_std": 30.6537, "Agent": "TD3"}, {"env_step": 645000, "rew": 86.5869, "rew_std": 30.4763, "Agent": "TD3"}, {"env_step": 650000, "rew": 87.3203, "rew_std": 32.0232, "Agent": "TD3"}, {"env_step": 655000, "rew": 87.7947, "rew_std": 29.9599, "Agent": "TD3"}, {"env_step": 660000, "rew": 87.8461, "rew_std": 30.2639, "Agent": "TD3"}, {"env_step": 665000, "rew": 88.8311, "rew_std": 32.377, "Agent": "TD3"}, {"env_step": 670000, "rew": 84.6939, "rew_std": 32.3997, "Agent": "TD3"}, {"env_step": 675000, "rew": 85.5088, "rew_std": 32.55, "Agent": "TD3"}, {"env_step": 680000, "rew": 87.4098, "rew_std": 31.2783, "Agent": "TD3"}, {"env_step": 685000, "rew": 88.276, "rew_std": 32.8023, "Agent": "TD3"}, {"env_step": 690000, "rew": 87.2682, "rew_std": 32.3965, "Agent": "TD3"}, {"env_step": 695000, "rew": 89.4875, "rew_std": 31.3106, "Agent": "TD3"}, {"env_step": 700000, "rew": 89.3074, "rew_std": 31.7229, "Agent": "TD3"}, {"env_step": 705000, "rew": 91.8734, "rew_std": 31.0277, "Agent": "TD3"}, {"env_step": 710000, "rew": 88.4577, "rew_std": 28.9902, "Agent": "TD3"}, {"env_step": 715000, "rew": 90.7966, "rew_std": 28.9473, "Agent": "TD3"}, {"env_step": 720000, "rew": 88.8606, "rew_std": 29.6708, "Agent": "TD3"}, {"env_step": 725000, "rew": 90.5793, "rew_std": 30.4509, "Agent": "TD3"}, {"env_step": 730000, "rew": 92.6566, "rew_std": 29.1638, "Agent": "TD3"}, {"env_step": 735000, "rew": 91.0644, "rew_std": 30.132, "Agent": "TD3"}, {"env_step": 740000, "rew": 93.81, "rew_std": 31.2251, "Agent": "TD3"}, {"env_step": 745000, "rew": 93.186, "rew_std": 30.4468, "Agent": "TD3"}, {"env_step": 750000, "rew": 92.6643, "rew_std": 31.8271, "Agent": "TD3"}, {"env_step": 755000, "rew": 95.9085, "rew_std": 30.7396, "Agent": "TD3"}, {"env_step": 760000, "rew": 93.2766, "rew_std": 30.5946, "Agent": "TD3"}, {"env_step": 765000, "rew": 91.7779, "rew_std": 30.9428, "Agent": "TD3"}, {"env_step": 770000, "rew": 92.8975, "rew_std": 30.3727, "Agent": "TD3"}, {"env_step": 775000, "rew": 93.2678, "rew_std": 30.035, "Agent": "TD3"}, {"env_step": 780000, "rew": 94.9334, "rew_std": 30.218, "Agent": "TD3"}, {"env_step": 785000, "rew": 97.689, "rew_std": 33.428, "Agent": "TD3"}, {"env_step": 790000, "rew": 95.8544, "rew_std": 29.5172, "Agent": "TD3"}, {"env_step": 795000, "rew": 95.3164, "rew_std": 31.1582, "Agent": "TD3"}, {"env_step": 800000, "rew": 99.102, "rew_std": 34.4922, "Agent": "TD3"}, {"env_step": 805000, "rew": 98.9969, "rew_std": 33.5135, "Agent": "TD3"}, {"env_step": 810000, "rew": 97.6485, "rew_std": 34.9215, "Agent": "TD3"}, {"env_step": 815000, "rew": 97.5072, "rew_std": 33.132, "Agent": "TD3"}, {"env_step": 820000, "rew": 100.9863, "rew_std": 32.6827, "Agent": "TD3"}, {"env_step": 825000, "rew": 97.8096, "rew_std": 31.934, "Agent": "TD3"}, {"env_step": 830000, "rew": 100.3499, "rew_std": 33.2398, "Agent": "TD3"}, {"env_step": 835000, "rew": 99.6387, "rew_std": 32.1877, "Agent": "TD3"}, {"env_step": 840000, "rew": 100.1878, "rew_std": 35.5064, "Agent": "TD3"}, {"env_step": 845000, "rew": 100.9504, "rew_std": 31.808, "Agent": "TD3"}, {"env_step": 850000, "rew": 102.5165, "rew_std": 34.9759, "Agent": "TD3"}, {"env_step": 855000, "rew": 99.8103, "rew_std": 32.3758, "Agent": "TD3"}, {"env_step": 860000, "rew": 101.7581, "rew_std": 31.9818, "Agent": "TD3"}, {"env_step": 865000, "rew": 100.7405, "rew_std": 32.7885, "Agent": "TD3"}, {"env_step": 870000, "rew": 100.8249, "rew_std": 33.4003, "Agent": "TD3"}, {"env_step": 875000, "rew": 100.7485, "rew_std": 33.2082, "Agent": "TD3"}, {"env_step": 880000, "rew": 102.5295, "rew_std": 34.4189, "Agent": "TD3"}, {"env_step": 885000, "rew": 99.8226, "rew_std": 32.9092, "Agent": "TD3"}, {"env_step": 890000, "rew": 94.6528, "rew_std": 34.0478, "Agent": "TD3"}, {"env_step": 895000, "rew": 93.6971, "rew_std": 32.7561, "Agent": "TD3"}, {"env_step": 900000, "rew": 101.2272, "rew_std": 33.0066, "Agent": "TD3"}, {"env_step": 905000, "rew": 99.1686, "rew_std": 32.928, "Agent": "TD3"}, {"env_step": 910000, "rew": 101.3434, "rew_std": 33.0791, "Agent": "TD3"}, {"env_step": 915000, "rew": 100.4035, "rew_std": 33.5787, "Agent": "TD3"}, {"env_step": 920000, "rew": 99.3797, "rew_std": 34.4315, "Agent": "TD3"}, {"env_step": 925000, "rew": 100.1444, "rew_std": 34.0045, "Agent": "TD3"}, {"env_step": 930000, "rew": 97.4632, "rew_std": 33.0392, "Agent": "TD3"}, {"env_step": 935000, "rew": 101.2141, "rew_std": 32.8136, "Agent": "TD3"}, {"env_step": 940000, "rew": 97.8222, "rew_std": 34.4894, "Agent": "TD3"}, {"env_step": 945000, "rew": 99.0311, "rew_std": 31.3895, "Agent": "TD3"}, {"env_step": 950000, "rew": 99.9747, "rew_std": 32.4121, "Agent": "TD3"}, {"env_step": 955000, "rew": 98.6989, "rew_std": 33.4333, "Agent": "TD3"}, {"env_step": 960000, "rew": 91.8445, "rew_std": 36.9984, "Agent": "TD3"}, {"env_step": 965000, "rew": 93.2391, "rew_std": 35.273, "Agent": "TD3"}, {"env_step": 970000, "rew": 93.917, "rew_std": 33.1432, "Agent": "TD3"}, {"env_step": 975000, "rew": 99.1082, "rew_std": 31.1777, "Agent": "TD3"}, {"env_step": 980000, "rew": 99.4874, "rew_std": 34.1046, "Agent": "TD3"}, {"env_step": 985000, "rew": 98.5446, "rew_std": 33.182, "Agent": "TD3"}, {"env_step": 990000, "rew": 104.1637, "rew_std": 34.1874, "Agent": "TD3"}, {"env_step": 995000, "rew": 101.2461, "rew_std": 34.129, "Agent": "TD3"}, {"env_step": 1000000, "rew": 96.2436, "rew_std": 33.4562, "Agent": "TD3"}, {"env_step": 1005000, "rew": 96.9054, "rew_std": 34.0766, "Agent": "TD3"}, {"env_step": 1010000, "rew": 102.1064, "rew_std": 32.5263, "Agent": "TD3"}, {"env_step": 1015000, "rew": 100.9795, "rew_std": 34.6542, "Agent": "TD3"}, {"env_step": 1020000, "rew": 98.552, "rew_std": 32.6727, "Agent": "TD3"}, {"env_step": 1025000, "rew": 100.4183, "rew_std": 35.4292, "Agent": "TD3"}, {"env_step": 1030000, "rew": 101.5891, "rew_std": 34.5836, "Agent": "TD3"}, {"env_step": 1035000, "rew": 101.3104, "rew_std": 33.444, "Agent": "TD3"}, {"env_step": 1040000, "rew": 98.8935, "rew_std": 34.7818, "Agent": "TD3"}, {"env_step": 1045000, "rew": 100.1006, "rew_std": 34.472, "Agent": "TD3"}, {"env_step": 1050000, "rew": 101.8728, "rew_std": 33.0307, "Agent": "TD3"}, {"env_step": 1055000, "rew": 100.3289, "rew_std": 33.8025, "Agent": "TD3"}, {"env_step": 1060000, "rew": 99.3667, "rew_std": 34.6098, "Agent": "TD3"}, {"env_step": 1065000, "rew": 100.904, "rew_std": 33.4198, "Agent": "TD3"}, {"env_step": 1070000, "rew": 101.9024, "rew_std": 33.8339, "Agent": "TD3"}, {"env_step": 1075000, "rew": 102.4069, "rew_std": 34.2427, "Agent": "TD3"}, {"env_step": 1080000, "rew": 100.5603, "rew_std": 33.2086, "Agent": "TD3"}, {"env_step": 1085000, "rew": 104.1487, "rew_std": 33.6152, "Agent": "TD3"}, {"env_step": 1090000, "rew": 101.7053, "rew_std": 33.0356, "Agent": "TD3"}, {"env_step": 1095000, "rew": 102.106, "rew_std": 32.8048, "Agent": "TD3"}, {"env_step": 1100000, "rew": 101.0828, "rew_std": 33.3971, "Agent": "TD3"}, {"env_step": 1105000, "rew": 102.5127, "rew_std": 32.3886, "Agent": "TD3"}, {"env_step": 1110000, "rew": 95.4044, "rew_std": 31.6599, "Agent": "TD3"}, {"env_step": 1115000, "rew": 102.8439, "rew_std": 32.6782, "Agent": "TD3"}, {"env_step": 1120000, "rew": 102.2217, "rew_std": 35.2064, "Agent": "TD3"}, {"env_step": 1125000, "rew": 102.1562, "rew_std": 34.7002, "Agent": "TD3"}, {"env_step": 1130000, "rew": 101.2998, "rew_std": 35.3869, "Agent": "TD3"}, {"env_step": 1135000, "rew": 102.9873, "rew_std": 32.7296, "Agent": "TD3"}, {"env_step": 1140000, "rew": 102.4587, "rew_std": 33.3457, "Agent": "TD3"}, {"env_step": 1145000, "rew": 103.994, "rew_std": 32.6864, "Agent": "TD3"}, {"env_step": 1150000, "rew": 103.5746, "rew_std": 31.4598, "Agent": "TD3"}, {"env_step": 1155000, "rew": 102.734, "rew_std": 31.8162, "Agent": "TD3"}, {"env_step": 1160000, "rew": 106.0746, "rew_std": 31.9923, "Agent": "TD3"}, {"env_step": 1165000, "rew": 104.1096, "rew_std": 32.0328, "Agent": "TD3"}, {"env_step": 1170000, "rew": 102.8255, "rew_std": 34.3626, "Agent": "TD3"}, {"env_step": 1175000, "rew": 102.9476, "rew_std": 33.3184, "Agent": "TD3"}, {"env_step": 1180000, "rew": 103.5396, "rew_std": 32.3704, "Agent": "TD3"}, {"env_step": 1185000, "rew": 103.7538, "rew_std": 33.86, "Agent": "TD3"}, {"env_step": 1190000, "rew": 106.8142, "rew_std": 32.7257, "Agent": "TD3"}, {"env_step": 1195000, "rew": 104.5737, "rew_std": 32.7523, "Agent": "TD3"}, {"env_step": 1200000, "rew": 103.5237, "rew_std": 33.3121, "Agent": "TD3"}, {"env_step": 1205000, "rew": 104.1739, "rew_std": 33.8102, "Agent": "TD3"}, {"env_step": 1210000, "rew": 106.0291, "rew_std": 33.2563, "Agent": "TD3"}, {"env_step": 1215000, "rew": 106.5229, "rew_std": 34.5558, "Agent": "TD3"}, {"env_step": 1220000, "rew": 108.357, "rew_std": 33.9605, "Agent": "TD3"}, {"env_step": 1225000, "rew": 104.495, "rew_std": 33.2559, "Agent": "TD3"}, {"env_step": 1230000, "rew": 107.376, "rew_std": 32.6799, "Agent": "TD3"}, {"env_step": 1235000, "rew": 105.9014, "rew_std": 33.3857, "Agent": "TD3"}, {"env_step": 1240000, "rew": 106.8905, "rew_std": 33.261, "Agent": "TD3"}, {"env_step": 1245000, "rew": 108.226, "rew_std": 32.7489, "Agent": "TD3"}, {"env_step": 1250000, "rew": 106.2262, "rew_std": 34.3315, "Agent": "TD3"}, {"env_step": 0, "rew": 0.9618, "rew_std": 3.5215, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 21.6497, "rew_std": 2.0583, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 18.8407, "rew_std": 1.6384, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 21.3462, "rew_std": 1.0074, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 20.6712, "rew_std": 1.6014, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 19.9964, "rew_std": 2.1868, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 22.6191, "rew_std": 4.6673, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 20.3581, "rew_std": 1.9549, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 19.8743, "rew_std": 3.3722, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 21.3424, "rew_std": 2.5073, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 20.9955, "rew_std": 2.2787, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 20.4953, "rew_std": 2.7613, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 22.0264, "rew_std": 4.6766, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 22.3219, "rew_std": 5.2812, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 24.307, "rew_std": 6.9595, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 23.2968, "rew_std": 6.6963, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 20.2182, "rew_std": 6.8104, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 24.1779, "rew_std": 6.203, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 24.7635, "rew_std": 5.5496, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 25.7685, "rew_std": 7.252, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 23.2547, "rew_std": 8.9279, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 25.7667, "rew_std": 8.5028, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 26.3615, "rew_std": 5.6484, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 29.3509, "rew_std": 4.2497, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 27.4427, "rew_std": 4.5532, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 29.4254, "rew_std": 4.4139, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 28.885, "rew_std": 4.5786, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 29.5476, "rew_std": 5.0349, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 29.6066, "rew_std": 5.663, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 29.6368, "rew_std": 5.2243, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 29.8861, "rew_std": 5.0542, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 29.8157, "rew_std": 5.0216, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 30.0077, "rew_std": 7.2744, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 30.5773, "rew_std": 6.8568, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 29.8747, "rew_std": 6.5815, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 28.6939, "rew_std": 8.3452, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 30.8997, "rew_std": 4.6416, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 32.1676, "rew_std": 3.6635, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 33.282, "rew_std": 3.9632, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 32.7282, "rew_std": 4.2844, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 32.175, "rew_std": 1.4538, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 32.3137, "rew_std": 2.4142, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 33.0787, "rew_std": 1.7409, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 32.4292, "rew_std": 2.7709, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 33.5495, "rew_std": 1.8482, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 33.2865, "rew_std": 1.8124, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 34.02, "rew_std": 1.5783, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 32.4269, "rew_std": 1.3609, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 35.2871, "rew_std": 1.4372, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 32.8925, "rew_std": 2.0544, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 33.947, "rew_std": 2.344, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 33.2722, "rew_std": 2.4675, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 33.1716, "rew_std": 2.4712, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 31.8048, "rew_std": 3.1568, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 32.1113, "rew_std": 3.3193, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 32.7537, "rew_std": 2.7257, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 32.2556, "rew_std": 2.9733, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 34.5128, "rew_std": 2.3075, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 34.341, "rew_std": 2.7978, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 32.339, "rew_std": 2.7514, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 34.0286, "rew_std": 2.9285, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 32.9519, "rew_std": 2.0919, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 33.9109, "rew_std": 2.8357, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 34.4966, "rew_std": 1.0048, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 34.5729, "rew_std": 1.5995, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 33.9055, "rew_std": 1.9507, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 33.6248, "rew_std": 2.1721, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 33.5189, "rew_std": 2.9632, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 33.0232, "rew_std": 3.8123, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 33.4146, "rew_std": 3.783, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 32.7739, "rew_std": 3.8725, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 32.1464, "rew_std": 3.4452, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 32.4067, "rew_std": 3.6292, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 32.8531, "rew_std": 4.2917, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 31.3723, "rew_std": 4.6388, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 31.7266, "rew_std": 4.3836, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 31.9897, "rew_std": 4.348, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 33.2492, "rew_std": 4.0503, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 32.555, "rew_std": 3.7809, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 32.5059, "rew_std": 3.2845, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 31.1916, "rew_std": 4.5898, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 32.4978, "rew_std": 3.9197, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 29.8591, "rew_std": 6.5104, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 31.2884, "rew_std": 4.2571, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 32.3156, "rew_std": 4.9718, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 32.6244, "rew_std": 5.1626, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 31.9868, "rew_std": 5.7592, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 32.893, "rew_std": 3.5311, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 32.205, "rew_std": 4.235, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 32.1189, "rew_std": 4.6476, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 32.3047, "rew_std": 4.5396, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 32.6739, "rew_std": 4.9249, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 33.2044, "rew_std": 4.504, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 33.0202, "rew_std": 3.5788, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 33.5991, "rew_std": 3.9779, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 33.6818, "rew_std": 3.3053, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 33.2439, "rew_std": 3.7153, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 35.0602, "rew_std": 2.1509, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 34.144, "rew_std": 1.9498, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 34.0212, "rew_std": 2.8477, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 33.22, "rew_std": 2.5058, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 34.3311, "rew_std": 2.0098, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 34.5845, "rew_std": 2.487, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 33.8012, "rew_std": 2.8445, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 33.4961, "rew_std": 2.9447, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 34.1328, "rew_std": 2.1202, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 33.9942, "rew_std": 2.1889, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 34.4959, "rew_std": 3.1445, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 34.1392, "rew_std": 4.2095, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 34.3033, "rew_std": 4.2899, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 34.2744, "rew_std": 3.3235, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 32.5941, "rew_std": 5.7054, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 32.5893, "rew_std": 5.6679, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 32.8065, "rew_std": 4.9803, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 34.058, "rew_std": 4.703, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 32.7505, "rew_std": 6.0165, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 32.9924, "rew_std": 5.2966, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 33.5606, "rew_std": 5.081, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 34.3386, "rew_std": 4.0346, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 33.9057, "rew_std": 4.381, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 34.9121, "rew_std": 2.9535, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 33.749, "rew_std": 3.1327, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 34.2743, "rew_std": 3.6415, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 35.3061, "rew_std": 2.1058, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 34.3247, "rew_std": 2.3545, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 34.8757, "rew_std": 3.2262, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 34.947, "rew_std": 2.9427, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 34.7932, "rew_std": 2.9123, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 34.0642, "rew_std": 5.3443, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 34.2344, "rew_std": 4.4914, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 33.9348, "rew_std": 4.2284, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 33.3052, "rew_std": 4.1758, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 33.9265, "rew_std": 5.0275, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 32.6343, "rew_std": 4.9864, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 33.7496, "rew_std": 3.5404, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 33.345, "rew_std": 4.1666, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 33.9686, "rew_std": 2.8585, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 34.0236, "rew_std": 3.1606, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 34.0668, "rew_std": 3.1711, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 34.0769, "rew_std": 2.6831, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 33.2015, "rew_std": 3.4703, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 33.1703, "rew_std": 3.6308, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 33.7326, "rew_std": 3.5252, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 33.1725, "rew_std": 3.596, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 32.7075, "rew_std": 4.6077, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 32.9265, "rew_std": 3.6788, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 33.281, "rew_std": 3.5235, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 32.0004, "rew_std": 4.0413, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 32.252, "rew_std": 3.6599, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 33.465, "rew_std": 4.4369, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 33.002, "rew_std": 4.3731, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 34.0664, "rew_std": 4.0684, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 34.2007, "rew_std": 4.326, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 33.1797, "rew_std": 3.901, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 33.247, "rew_std": 3.4091, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 33.1553, "rew_std": 4.0657, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 32.6889, "rew_std": 4.1791, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 33.854, "rew_std": 3.5738, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 33.5175, "rew_std": 3.3581, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 32.3676, "rew_std": 2.9989, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 32.6538, "rew_std": 3.5436, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 31.9695, "rew_std": 4.0538, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 33.8209, "rew_std": 3.4171, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 33.2326, "rew_std": 4.5398, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 33.0102, "rew_std": 5.1255, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 32.7645, "rew_std": 3.9751, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 33.3095, "rew_std": 3.5838, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 33.9164, "rew_std": 4.5219, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 33.2565, "rew_std": 3.1545, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 33.6445, "rew_std": 3.4789, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 32.9714, "rew_std": 5.0788, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 33.2731, "rew_std": 4.1268, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 34.2387, "rew_std": 3.831, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 33.0195, "rew_std": 4.4602, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 33.0358, "rew_std": 4.7634, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 33.066, "rew_std": 5.381, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 32.8663, "rew_std": 4.5141, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 32.182, "rew_std": 5.3874, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 32.1664, "rew_std": 6.5647, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 32.4971, "rew_std": 5.5007, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 31.575, "rew_std": 5.0883, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 33.3368, "rew_std": 3.9527, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 33.6293, "rew_std": 4.5512, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 33.625, "rew_std": 3.9672, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 33.2956, "rew_std": 4.5379, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 33.2566, "rew_std": 4.1496, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 33.7133, "rew_std": 4.1502, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 34.8932, "rew_std": 3.706, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 34.6708, "rew_std": 3.8852, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 34.7482, "rew_std": 3.4388, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 34.3264, "rew_std": 3.6939, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 33.9703, "rew_std": 3.2207, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 34.8393, "rew_std": 4.2321, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 34.9294, "rew_std": 4.0082, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 34.1719, "rew_std": 4.7017, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 33.3955, "rew_std": 4.192, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 32.3953, "rew_std": 5.2512, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 33.3806, "rew_std": 4.3844, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 33.129, "rew_std": 5.484, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 32.5978, "rew_std": 5.0187, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 33.2739, "rew_std": 3.9319, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 32.561, "rew_std": 4.5382, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 32.4747, "rew_std": 5.3743, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 32.4632, "rew_std": 5.8385, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 32.6665, "rew_std": 5.6886, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 31.5359, "rew_std": 6.0376, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 32.0438, "rew_std": 5.7212, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 30.95, "rew_std": 7.1644, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 32.0496, "rew_std": 6.4098, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 32.5061, "rew_std": 5.9136, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 32.4526, "rew_std": 5.9224, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 32.3688, "rew_std": 6.1382, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 32.2328, "rew_std": 4.6938, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 31.9146, "rew_std": 4.3941, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 31.4479, "rew_std": 6.3545, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 30.8629, "rew_std": 5.4676, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 30.7007, "rew_std": 5.5163, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 31.7723, "rew_std": 5.9939, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 32.615, "rew_std": 5.8788, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 31.6344, "rew_std": 4.9203, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 32.0157, "rew_std": 5.063, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 31.7169, "rew_std": 4.5693, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 32.4026, "rew_std": 4.4906, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 30.6853, "rew_std": 5.5575, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 31.1717, "rew_std": 5.9472, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 31.6307, "rew_std": 4.759, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 31.6028, "rew_std": 5.7942, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 31.8346, "rew_std": 5.6822, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 31.9882, "rew_std": 5.955, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 32.382, "rew_std": 5.8684, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 31.0684, "rew_std": 6.2851, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 30.9765, "rew_std": 5.6595, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 31.9173, "rew_std": 5.1753, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 31.3002, "rew_std": 5.7539, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 32.7446, "rew_std": 5.5887, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 31.3714, "rew_std": 6.5631, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 32.337, "rew_std": 5.475, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 31.2519, "rew_std": 5.9219, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 33.2408, "rew_std": 4.933, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 32.6244, "rew_std": 5.3486, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 32.2818, "rew_std": 5.1002, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 32.4273, "rew_std": 5.6617, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 32.5061, "rew_std": 5.56, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 31.0894, "rew_std": 5.8324, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 31.6037, "rew_std": 6.0186, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 32.7055, "rew_std": 6.2364, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 32.8096, "rew_std": 4.6631, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 32.5216, "rew_std": 5.6356, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 32.3616, "rew_std": 6.5821, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 32.4397, "rew_std": 5.0747, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 32.0721, "rew_std": 6.0841, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 32.0599, "rew_std": 5.1005, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 32.512, "rew_std": 5.0088, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 33.6162, "rew_std": 4.6397, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 32.9104, "rew_std": 4.5188, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 32.8331, "rew_std": 4.9909, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 32.7758, "rew_std": 4.5786, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 34.003, "rew_std": 4.3646, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 32.4516, "rew_std": 5.5562, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 34.1675, "rew_std": 4.9455, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 33.6632, "rew_std": 4.0695, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 34.0068, "rew_std": 4.107, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 33.4871, "rew_std": 4.6873, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 33.7246, "rew_std": 4.5231, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 32.5878, "rew_std": 5.5223, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 33.9746, "rew_std": 4.7386, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 32.6613, "rew_std": 5.3638, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 33.0588, "rew_std": 5.1075, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 33.9021, "rew_std": 5.0514, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 34.0947, "rew_std": 4.5952, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 32.703, "rew_std": 4.7867, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 34.1386, "rew_std": 4.75, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 33.9661, "rew_std": 4.4242, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 34.7524, "rew_std": 4.6168, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 33.9398, "rew_std": 4.263, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 33.1136, "rew_std": 5.6609, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 34.2965, "rew_std": 4.169, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 33.6618, "rew_std": 4.5977, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 33.6729, "rew_std": 4.0488, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 34.9866, "rew_std": 4.0343, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 34.5048, "rew_std": 4.5793, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 34.0164, "rew_std": 4.0996, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 34.5609, "rew_std": 3.7994, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 33.8448, "rew_std": 4.3228, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 33.4444, "rew_std": 4.5564, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 33.525, "rew_std": 4.4545, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 33.7675, "rew_std": 5.0768, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 34.8722, "rew_std": 3.4362, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 33.9305, "rew_std": 3.8452, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 33.381, "rew_std": 4.6669, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 34.5151, "rew_std": 4.0725, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 34.5288, "rew_std": 4.3255, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 34.3572, "rew_std": 4.0005, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 35.5993, "rew_std": 4.8346, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 35.0188, "rew_std": 3.7941, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 32.4251, "rew_std": 4.2903, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 34.6576, "rew_std": 4.1041, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 33.9335, "rew_std": 4.2551, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 33.5112, "rew_std": 4.5228, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 35.0373, "rew_std": 4.2203, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 33.1811, "rew_std": 4.8138, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 35.6357, "rew_std": 2.5664, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 35.1787, "rew_std": 3.656, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 34.1176, "rew_std": 4.1731, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 32.852, "rew_std": 5.0998, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 34.1419, "rew_std": 4.3647, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 34.9605, "rew_std": 4.4513, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 34.0714, "rew_std": 4.1276, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 33.9586, "rew_std": 4.0475, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 32.7241, "rew_std": 5.6342, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 34.8576, "rew_std": 4.3271, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 34.5418, "rew_std": 4.3088, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 33.4314, "rew_std": 4.8686, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 34.31, "rew_std": 4.2917, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 34.1281, "rew_std": 4.2791, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 34.2341, "rew_std": 4.776, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 34.8616, "rew_std": 3.861, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 33.6738, "rew_std": 4.3368, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 34.363, "rew_std": 4.2437, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 33.7762, "rew_std": 4.6374, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 34.3446, "rew_std": 4.5658, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 34.2667, "rew_std": 4.1647, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 34.6621, "rew_std": 4.0091, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 33.8437, "rew_std": 4.2047, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 33.6302, "rew_std": 4.7983, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 34.0698, "rew_std": 4.1396, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 32.9844, "rew_std": 5.1013, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 33.5285, "rew_std": 4.4086, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 34.0825, "rew_std": 4.5864, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 34.2197, "rew_std": 4.7614, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 33.4028, "rew_std": 4.4683, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 33.7714, "rew_std": 5.2796, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 33.7844, "rew_std": 5.0687, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 34.2833, "rew_std": 4.5147, "Agent": "REINFORCE"}, {"env_step": 0, "rew": -7.7439, "rew_std": 16.8878, "Agent": "SAC"}, {"env_step": 5000, "rew": 26.2874, "rew_std": 10.5409, "Agent": "SAC"}, {"env_step": 10000, "rew": 25.6709, "rew_std": 8.9848, "Agent": "SAC"}, {"env_step": 15000, "rew": 33.9519, "rew_std": 3.7954, "Agent": "SAC"}, {"env_step": 20000, "rew": 38.1491, "rew_std": 2.543, "Agent": "SAC"}, {"env_step": 25000, "rew": 39.3281, "rew_std": 2.1892, "Agent": "SAC"}, {"env_step": 30000, "rew": 38.0972, "rew_std": 2.6193, "Agent": "SAC"}, {"env_step": 35000, "rew": 39.4004, "rew_std": 1.9991, "Agent": "SAC"}, {"env_step": 40000, "rew": 39.3137, "rew_std": 1.7931, "Agent": "SAC"}, {"env_step": 45000, "rew": 38.8152, "rew_std": 1.6557, "Agent": "SAC"}, {"env_step": 50000, "rew": 39.8585, "rew_std": 1.157, "Agent": "SAC"}, {"env_step": 55000, "rew": 38.1781, "rew_std": 4.3822, "Agent": "SAC"}, {"env_step": 60000, "rew": 37.8314, "rew_std": 4.4601, "Agent": "SAC"}, {"env_step": 65000, "rew": 38.3241, "rew_std": 2.8926, "Agent": "SAC"}, {"env_step": 70000, "rew": 39.395, "rew_std": 1.2904, "Agent": "SAC"}, {"env_step": 75000, "rew": 39.6681, "rew_std": 1.354, "Agent": "SAC"}, {"env_step": 80000, "rew": 40.2258, "rew_std": 1.3807, "Agent": "SAC"}, {"env_step": 85000, "rew": 40.0252, "rew_std": 1.7095, "Agent": "SAC"}, {"env_step": 90000, "rew": 39.8833, "rew_std": 1.071, "Agent": "SAC"}, {"env_step": 95000, "rew": 37.6892, "rew_std": 4.3594, "Agent": "SAC"}, {"env_step": 100000, "rew": 39.866, "rew_std": 1.494, "Agent": "SAC"}, {"env_step": 105000, "rew": 40.3161, "rew_std": 1.5569, "Agent": "SAC"}, {"env_step": 110000, "rew": 38.6797, "rew_std": 5.4645, "Agent": "SAC"}, {"env_step": 115000, "rew": 39.4061, "rew_std": 1.0227, "Agent": "SAC"}, {"env_step": 120000, "rew": 39.0564, "rew_std": 1.6067, "Agent": "SAC"}, {"env_step": 125000, "rew": 41.2194, "rew_std": 1.1145, "Agent": "SAC"}, {"env_step": 130000, "rew": 38.7546, "rew_std": 2.59, "Agent": "SAC"}, {"env_step": 135000, "rew": 41.1758, "rew_std": 1.2852, "Agent": "SAC"}, {"env_step": 140000, "rew": 40.7014, "rew_std": 1.3486, "Agent": "SAC"}, {"env_step": 145000, "rew": 40.0147, "rew_std": 1.7605, "Agent": "SAC"}, {"env_step": 150000, "rew": 40.3221, "rew_std": 1.2607, "Agent": "SAC"}, {"env_step": 155000, "rew": 41.6201, "rew_std": 1.3049, "Agent": "SAC"}, {"env_step": 160000, "rew": 41.3052, "rew_std": 1.0019, "Agent": "SAC"}, {"env_step": 165000, "rew": 39.9204, "rew_std": 2.8623, "Agent": "SAC"}, {"env_step": 170000, "rew": 40.9499, "rew_std": 1.6341, "Agent": "SAC"}, {"env_step": 175000, "rew": 42.1303, "rew_std": 1.635, "Agent": "SAC"}, {"env_step": 180000, "rew": 41.3798, "rew_std": 1.3728, "Agent": "SAC"}, {"env_step": 185000, "rew": 41.6402, "rew_std": 1.3664, "Agent": "SAC"}, {"env_step": 190000, "rew": 41.8703, "rew_std": 1.0121, "Agent": "SAC"}, {"env_step": 195000, "rew": 41.686, "rew_std": 2.8906, "Agent": "SAC"}, {"env_step": 200000, "rew": 41.7817, "rew_std": 0.8474, "Agent": "SAC"}, {"env_step": 205000, "rew": 41.7951, "rew_std": 1.7754, "Agent": "SAC"}, {"env_step": 210000, "rew": 42.0247, "rew_std": 1.4268, "Agent": "SAC"}, {"env_step": 215000, "rew": 42.3229, "rew_std": 0.7668, "Agent": "SAC"}, {"env_step": 220000, "rew": 40.6762, "rew_std": 2.6318, "Agent": "SAC"}, {"env_step": 225000, "rew": 41.497, "rew_std": 0.6603, "Agent": "SAC"}, {"env_step": 230000, "rew": 41.5852, "rew_std": 1.2995, "Agent": "SAC"}, {"env_step": 235000, "rew": 39.668, "rew_std": 6.5793, "Agent": "SAC"}, {"env_step": 240000, "rew": 41.4187, "rew_std": 0.7364, "Agent": "SAC"}, {"env_step": 245000, "rew": 41.6194, "rew_std": 0.9224, "Agent": "SAC"}, {"env_step": 250000, "rew": 42.5275, "rew_std": 0.8569, "Agent": "SAC"}, {"env_step": 255000, "rew": 42.1773, "rew_std": 0.8542, "Agent": "SAC"}, {"env_step": 260000, "rew": 40.6498, "rew_std": 1.9453, "Agent": "SAC"}, {"env_step": 265000, "rew": 41.8543, "rew_std": 0.7636, "Agent": "SAC"}, {"env_step": 270000, "rew": 41.4246, "rew_std": 1.4716, "Agent": "SAC"}, {"env_step": 275000, "rew": 41.6244, "rew_std": 1.4436, "Agent": "SAC"}, {"env_step": 280000, "rew": 41.762, "rew_std": 1.3608, "Agent": "SAC"}, {"env_step": 285000, "rew": 41.7634, "rew_std": 2.4729, "Agent": "SAC"}, {"env_step": 290000, "rew": 42.5842, "rew_std": 1.3938, "Agent": "SAC"}, {"env_step": 295000, "rew": 42.0463, "rew_std": 1.3349, "Agent": "SAC"}, {"env_step": 300000, "rew": 41.4114, "rew_std": 2.0244, "Agent": "SAC"}, {"env_step": 305000, "rew": 41.8277, "rew_std": 0.8916, "Agent": "SAC"}, {"env_step": 310000, "rew": 42.9752, "rew_std": 1.0657, "Agent": "SAC"}, {"env_step": 315000, "rew": 42.2197, "rew_std": 0.99, "Agent": "SAC"}, {"env_step": 320000, "rew": 41.3587, "rew_std": 1.7308, "Agent": "SAC"}, {"env_step": 325000, "rew": 42.1496, "rew_std": 0.8021, "Agent": "SAC"}, {"env_step": 330000, "rew": 42.0622, "rew_std": 1.483, "Agent": "SAC"}, {"env_step": 335000, "rew": 42.4782, "rew_std": 1.7003, "Agent": "SAC"}, {"env_step": 340000, "rew": 42.1533, "rew_std": 0.7591, "Agent": "SAC"}, {"env_step": 345000, "rew": 41.324, "rew_std": 1.244, "Agent": "SAC"}, {"env_step": 350000, "rew": 42.606, "rew_std": 1.386, "Agent": "SAC"}, {"env_step": 355000, "rew": 41.5811, "rew_std": 1.7395, "Agent": "SAC"}, {"env_step": 360000, "rew": 42.418, "rew_std": 1.5588, "Agent": "SAC"}, {"env_step": 365000, "rew": 41.6303, "rew_std": 0.759, "Agent": "SAC"}, {"env_step": 370000, "rew": 42.2691, "rew_std": 0.9922, "Agent": "SAC"}, {"env_step": 375000, "rew": 42.5791, "rew_std": 1.3288, "Agent": "SAC"}, {"env_step": 380000, "rew": 42.7526, "rew_std": 1.0351, "Agent": "SAC"}, {"env_step": 385000, "rew": 43.2361, "rew_std": 1.4465, "Agent": "SAC"}, {"env_step": 390000, "rew": 41.8614, "rew_std": 0.9324, "Agent": "SAC"}, {"env_step": 395000, "rew": 42.3396, "rew_std": 1.3756, "Agent": "SAC"}, {"env_step": 400000, "rew": 41.9191, "rew_std": 1.1385, "Agent": "SAC"}, {"env_step": 405000, "rew": 41.5898, "rew_std": 1.1394, "Agent": "SAC"}, {"env_step": 410000, "rew": 41.2049, "rew_std": 2.1405, "Agent": "SAC"}, {"env_step": 415000, "rew": 43.1547, "rew_std": 1.3899, "Agent": "SAC"}, {"env_step": 420000, "rew": 41.9552, "rew_std": 1.4365, "Agent": "SAC"}, {"env_step": 425000, "rew": 42.865, "rew_std": 0.7121, "Agent": "SAC"}, {"env_step": 430000, "rew": 43.2182, "rew_std": 1.2923, "Agent": "SAC"}, {"env_step": 435000, "rew": 43.0546, "rew_std": 1.1176, "Agent": "SAC"}, {"env_step": 440000, "rew": 42.1793, "rew_std": 1.0319, "Agent": "SAC"}, {"env_step": 445000, "rew": 42.3744, "rew_std": 1.1834, "Agent": "SAC"}, {"env_step": 450000, "rew": 42.7055, "rew_std": 1.0265, "Agent": "SAC"}, {"env_step": 455000, "rew": 42.7255, "rew_std": 0.888, "Agent": "SAC"}, {"env_step": 460000, "rew": 42.2179, "rew_std": 1.6927, "Agent": "SAC"}, {"env_step": 465000, "rew": 42.4877, "rew_std": 1.298, "Agent": "SAC"}, {"env_step": 470000, "rew": 42.8837, "rew_std": 1.0435, "Agent": "SAC"}, {"env_step": 475000, "rew": 42.9676, "rew_std": 0.9981, "Agent": "SAC"}, {"env_step": 480000, "rew": 42.9281, "rew_std": 1.965, "Agent": "SAC"}, {"env_step": 485000, "rew": 42.3553, "rew_std": 0.884, "Agent": "SAC"}, {"env_step": 490000, "rew": 42.5956, "rew_std": 0.8306, "Agent": "SAC"}, {"env_step": 495000, "rew": 42.3804, "rew_std": 1.8631, "Agent": "SAC"}, {"env_step": 500000, "rew": 40.6518, "rew_std": 2.8328, "Agent": "SAC"}, {"env_step": 505000, "rew": 41.8868, "rew_std": 2.1089, "Agent": "SAC"}, {"env_step": 510000, "rew": 42.2984, "rew_std": 1.8482, "Agent": "SAC"}, {"env_step": 515000, "rew": 42.5435, "rew_std": 1.5197, "Agent": "SAC"}, {"env_step": 520000, "rew": 42.5111, "rew_std": 1.2591, "Agent": "SAC"}, {"env_step": 525000, "rew": 42.5548, "rew_std": 1.581, "Agent": "SAC"}, {"env_step": 530000, "rew": 43.2509, "rew_std": 1.0975, "Agent": "SAC"}, {"env_step": 535000, "rew": 42.8992, "rew_std": 0.6006, "Agent": "SAC"}, {"env_step": 540000, "rew": 42.6448, "rew_std": 0.6434, "Agent": "SAC"}, {"env_step": 545000, "rew": 43.6739, "rew_std": 1.03, "Agent": "SAC"}, {"env_step": 550000, "rew": 42.1373, "rew_std": 1.1803, "Agent": "SAC"}, {"env_step": 555000, "rew": 43.392, "rew_std": 0.7966, "Agent": "SAC"}, {"env_step": 560000, "rew": 42.998, "rew_std": 1.7691, "Agent": "SAC"}, {"env_step": 565000, "rew": 42.3194, "rew_std": 1.6072, "Agent": "SAC"}, {"env_step": 570000, "rew": 42.4264, "rew_std": 1.0855, "Agent": "SAC"}, {"env_step": 575000, "rew": 43.0293, "rew_std": 1.5761, "Agent": "SAC"}, {"env_step": 580000, "rew": 43.1212, "rew_std": 1.0842, "Agent": "SAC"}, {"env_step": 585000, "rew": 43.7142, "rew_std": 0.8072, "Agent": "SAC"}, {"env_step": 590000, "rew": 42.9435, "rew_std": 0.8323, "Agent": "SAC"}, {"env_step": 595000, "rew": 43.0102, "rew_std": 1.1116, "Agent": "SAC"}, {"env_step": 600000, "rew": 42.6918, "rew_std": 1.7408, "Agent": "SAC"}, {"env_step": 605000, "rew": 42.9151, "rew_std": 1.5017, "Agent": "SAC"}, {"env_step": 610000, "rew": 42.4029, "rew_std": 1.1383, "Agent": "SAC"}, {"env_step": 615000, "rew": 42.2635, "rew_std": 1.1714, "Agent": "SAC"}, {"env_step": 620000, "rew": 42.2494, "rew_std": 2.1549, "Agent": "SAC"}, {"env_step": 625000, "rew": 42.9938, "rew_std": 0.8821, "Agent": "SAC"}, {"env_step": 630000, "rew": 42.7989, "rew_std": 0.8944, "Agent": "SAC"}, {"env_step": 635000, "rew": 42.8052, "rew_std": 1.5786, "Agent": "SAC"}, {"env_step": 640000, "rew": 42.9076, "rew_std": 0.7705, "Agent": "SAC"}, {"env_step": 645000, "rew": 42.7719, "rew_std": 0.8277, "Agent": "SAC"}, {"env_step": 650000, "rew": 42.0232, "rew_std": 1.5944, "Agent": "SAC"}, {"env_step": 655000, "rew": 42.4545, "rew_std": 1.5504, "Agent": "SAC"}, {"env_step": 660000, "rew": 42.6647, "rew_std": 1.2738, "Agent": "SAC"}, {"env_step": 665000, "rew": 42.8804, "rew_std": 0.8634, "Agent": "SAC"}, {"env_step": 670000, "rew": 42.26, "rew_std": 1.2206, "Agent": "SAC"}, {"env_step": 675000, "rew": 42.8885, "rew_std": 0.7465, "Agent": "SAC"}, {"env_step": 680000, "rew": 43.2638, "rew_std": 0.5848, "Agent": "SAC"}, {"env_step": 685000, "rew": 42.8161, "rew_std": 1.0889, "Agent": "SAC"}, {"env_step": 690000, "rew": 43.6413, "rew_std": 0.8257, "Agent": "SAC"}, {"env_step": 695000, "rew": 42.0686, "rew_std": 2.5861, "Agent": "SAC"}, {"env_step": 700000, "rew": 42.6375, "rew_std": 0.859, "Agent": "SAC"}, {"env_step": 705000, "rew": 43.1986, "rew_std": 0.924, "Agent": "SAC"}, {"env_step": 710000, "rew": 42.8405, "rew_std": 1.2386, "Agent": "SAC"}, {"env_step": 715000, "rew": 42.6156, "rew_std": 2.2722, "Agent": "SAC"}, {"env_step": 720000, "rew": 42.7577, "rew_std": 0.8786, "Agent": "SAC"}, {"env_step": 725000, "rew": 43.4543, "rew_std": 1.2874, "Agent": "SAC"}, {"env_step": 730000, "rew": 43.7171, "rew_std": 0.6439, "Agent": "SAC"}, {"env_step": 735000, "rew": 42.5117, "rew_std": 1.2804, "Agent": "SAC"}, {"env_step": 740000, "rew": 43.3573, "rew_std": 1.2178, "Agent": "SAC"}, {"env_step": 745000, "rew": 42.8615, "rew_std": 1.4943, "Agent": "SAC"}, {"env_step": 750000, "rew": 43.3079, "rew_std": 1.2424, "Agent": "SAC"}, {"env_step": 755000, "rew": 42.3746, "rew_std": 1.0121, "Agent": "SAC"}, {"env_step": 760000, "rew": 42.8132, "rew_std": 1.0824, "Agent": "SAC"}, {"env_step": 765000, "rew": 43.7006, "rew_std": 0.7133, "Agent": "SAC"}, {"env_step": 770000, "rew": 43.3221, "rew_std": 0.9818, "Agent": "SAC"}, {"env_step": 775000, "rew": 42.4514, "rew_std": 1.4063, "Agent": "SAC"}, {"env_step": 780000, "rew": 43.8367, "rew_std": 0.9614, "Agent": "SAC"}, {"env_step": 785000, "rew": 43.2259, "rew_std": 1.0272, "Agent": "SAC"}, {"env_step": 790000, "rew": 43.4329, "rew_std": 0.8463, "Agent": "SAC"}, {"env_step": 795000, "rew": 43.2807, "rew_std": 0.6291, "Agent": "SAC"}, {"env_step": 800000, "rew": 43.2571, "rew_std": 1.088, "Agent": "SAC"}, {"env_step": 805000, "rew": 43.4552, "rew_std": 1.1519, "Agent": "SAC"}, {"env_step": 810000, "rew": 43.4323, "rew_std": 0.9875, "Agent": "SAC"}, {"env_step": 815000, "rew": 43.474, "rew_std": 0.9647, "Agent": "SAC"}, {"env_step": 820000, "rew": 43.0198, "rew_std": 1.1391, "Agent": "SAC"}, {"env_step": 825000, "rew": 42.789, "rew_std": 1.2367, "Agent": "SAC"}, {"env_step": 830000, "rew": 42.3454, "rew_std": 1.3127, "Agent": "SAC"}, {"env_step": 835000, "rew": 43.4136, "rew_std": 1.0791, "Agent": "SAC"}, {"env_step": 840000, "rew": 43.3779, "rew_std": 0.7225, "Agent": "SAC"}, {"env_step": 845000, "rew": 43.3594, "rew_std": 0.7372, "Agent": "SAC"}, {"env_step": 850000, "rew": 43.1062, "rew_std": 1.266, "Agent": "SAC"}, {"env_step": 855000, "rew": 42.6848, "rew_std": 0.9429, "Agent": "SAC"}, {"env_step": 860000, "rew": 43.5006, "rew_std": 0.8984, "Agent": "SAC"}, {"env_step": 865000, "rew": 43.2251, "rew_std": 1.3076, "Agent": "SAC"}, {"env_step": 870000, "rew": 43.7185, "rew_std": 0.9205, "Agent": "SAC"}, {"env_step": 875000, "rew": 43.6287, "rew_std": 1.03, "Agent": "SAC"}, {"env_step": 880000, "rew": 42.8404, "rew_std": 1.0181, "Agent": "SAC"}, {"env_step": 885000, "rew": 42.6213, "rew_std": 1.5867, "Agent": "SAC"}, {"env_step": 890000, "rew": 43.4013, "rew_std": 2.1414, "Agent": "SAC"}, {"env_step": 895000, "rew": 43.3951, "rew_std": 1.0499, "Agent": "SAC"}, {"env_step": 900000, "rew": 43.3527, "rew_std": 1.0789, "Agent": "SAC"}, {"env_step": 905000, "rew": 42.8644, "rew_std": 1.422, "Agent": "SAC"}, {"env_step": 910000, "rew": 42.9771, "rew_std": 1.0238, "Agent": "SAC"}, {"env_step": 915000, "rew": 43.5087, "rew_std": 1.0089, "Agent": "SAC"}, {"env_step": 920000, "rew": 43.373, "rew_std": 0.9359, "Agent": "SAC"}, {"env_step": 925000, "rew": 43.8177, "rew_std": 0.9008, "Agent": "SAC"}, {"env_step": 930000, "rew": 42.797, "rew_std": 0.8653, "Agent": "SAC"}, {"env_step": 935000, "rew": 43.276, "rew_std": 0.8909, "Agent": "SAC"}, {"env_step": 940000, "rew": 43.6976, "rew_std": 1.3921, "Agent": "SAC"}, {"env_step": 945000, "rew": 44.0239, "rew_std": 1.5283, "Agent": "SAC"}, {"env_step": 950000, "rew": 43.6672, "rew_std": 0.9988, "Agent": "SAC"}, {"env_step": 955000, "rew": 43.871, "rew_std": 0.9807, "Agent": "SAC"}, {"env_step": 960000, "rew": 44.3549, "rew_std": 0.4953, "Agent": "SAC"}, {"env_step": 965000, "rew": 43.8333, "rew_std": 1.216, "Agent": "SAC"}, {"env_step": 970000, "rew": 42.7589, "rew_std": 1.282, "Agent": "SAC"}, {"env_step": 975000, "rew": 43.4426, "rew_std": 1.0953, "Agent": "SAC"}, {"env_step": 980000, "rew": 43.913, "rew_std": 1.4897, "Agent": "SAC"}, {"env_step": 985000, "rew": 43.1539, "rew_std": 1.1106, "Agent": "SAC"}, {"env_step": 990000, "rew": 43.6382, "rew_std": 0.874, "Agent": "SAC"}, {"env_step": 995000, "rew": 43.3717, "rew_std": 2.2402, "Agent": "SAC"}, {"env_step": 1000000, "rew": 43.5731, "rew_std": 0.9632, "Agent": "SAC"}, {"env_step": 1005000, "rew": 44.2985, "rew_std": 1.4402, "Agent": "SAC"}, {"env_step": 1010000, "rew": 43.1896, "rew_std": 1.0631, "Agent": "SAC"}, {"env_step": 1015000, "rew": 43.7741, "rew_std": 1.1827, "Agent": "SAC"}, {"env_step": 1020000, "rew": 43.3785, "rew_std": 1.3209, "Agent": "SAC"}, {"env_step": 1025000, "rew": 43.4507, "rew_std": 0.8396, "Agent": "SAC"}, {"env_step": 1030000, "rew": 43.0527, "rew_std": 0.7842, "Agent": "SAC"}, {"env_step": 1035000, "rew": 43.5944, "rew_std": 0.8916, "Agent": "SAC"}, {"env_step": 1040000, "rew": 43.0462, "rew_std": 0.8515, "Agent": "SAC"}, {"env_step": 1045000, "rew": 43.3839, "rew_std": 0.5822, "Agent": "SAC"}, {"env_step": 1050000, "rew": 43.4203, "rew_std": 1.0907, "Agent": "SAC"}, {"env_step": 1055000, "rew": 43.3705, "rew_std": 0.9512, "Agent": "SAC"}, {"env_step": 1060000, "rew": 43.7978, "rew_std": 0.704, "Agent": "SAC"}, {"env_step": 1065000, "rew": 43.7268, "rew_std": 0.9554, "Agent": "SAC"}, {"env_step": 1070000, "rew": 43.5983, "rew_std": 0.7237, "Agent": "SAC"}, {"env_step": 1075000, "rew": 43.5771, "rew_std": 1.0144, "Agent": "SAC"}, {"env_step": 1080000, "rew": 44.0056, "rew_std": 1.0758, "Agent": "SAC"}, {"env_step": 1085000, "rew": 44.1718, "rew_std": 0.9893, "Agent": "SAC"}, {"env_step": 1090000, "rew": 43.1443, "rew_std": 0.9257, "Agent": "SAC"}, {"env_step": 1095000, "rew": 43.5743, "rew_std": 1.2003, "Agent": "SAC"}, {"env_step": 1100000, "rew": 43.8866, "rew_std": 0.8057, "Agent": "SAC"}, {"env_step": 1105000, "rew": 44.0473, "rew_std": 0.876, "Agent": "SAC"}, {"env_step": 1110000, "rew": 43.4748, "rew_std": 0.9671, "Agent": "SAC"}, {"env_step": 1115000, "rew": 43.2211, "rew_std": 1.2039, "Agent": "SAC"}, {"env_step": 1120000, "rew": 44.6832, "rew_std": 0.8636, "Agent": "SAC"}, {"env_step": 1125000, "rew": 43.3888, "rew_std": 0.914, "Agent": "SAC"}, {"env_step": 1130000, "rew": 43.9367, "rew_std": 0.9688, "Agent": "SAC"}, {"env_step": 1135000, "rew": 44.0778, "rew_std": 0.8398, "Agent": "SAC"}, {"env_step": 1140000, "rew": 43.6552, "rew_std": 0.8414, "Agent": "SAC"}, {"env_step": 1145000, "rew": 43.8613, "rew_std": 0.7711, "Agent": "SAC"}, {"env_step": 1150000, "rew": 43.7305, "rew_std": 0.9517, "Agent": "SAC"}, {"env_step": 1155000, "rew": 44.4041, "rew_std": 0.7634, "Agent": "SAC"}, {"env_step": 1160000, "rew": 44.1468, "rew_std": 0.5902, "Agent": "SAC"}, {"env_step": 1165000, "rew": 43.6025, "rew_std": 0.4915, "Agent": "SAC"}, {"env_step": 1170000, "rew": 43.6958, "rew_std": 1.1437, "Agent": "SAC"}, {"env_step": 1175000, "rew": 43.7657, "rew_std": 1.3804, "Agent": "SAC"}, {"env_step": 1180000, "rew": 43.9155, "rew_std": 0.9774, "Agent": "SAC"}, {"env_step": 1185000, "rew": 43.7091, "rew_std": 0.7425, "Agent": "SAC"}, {"env_step": 1190000, "rew": 43.9555, "rew_std": 0.5798, "Agent": "SAC"}, {"env_step": 1195000, "rew": 43.2931, "rew_std": 0.8764, "Agent": "SAC"}, {"env_step": 1200000, "rew": 43.1039, "rew_std": 2.1058, "Agent": "SAC"}, {"env_step": 1205000, "rew": 43.7402, "rew_std": 0.7227, "Agent": "SAC"}, {"env_step": 1210000, "rew": 43.0009, "rew_std": 0.7026, "Agent": "SAC"}, {"env_step": 1215000, "rew": 43.0386, "rew_std": 1.1108, "Agent": "SAC"}, {"env_step": 1220000, "rew": 43.8467, "rew_std": 1.314, "Agent": "SAC"}, {"env_step": 1225000, "rew": 44.4796, "rew_std": 1.3949, "Agent": "SAC"}, {"env_step": 1230000, "rew": 43.759, "rew_std": 1.2652, "Agent": "SAC"}, {"env_step": 1235000, "rew": 44.294, "rew_std": 0.8111, "Agent": "SAC"}, {"env_step": 1240000, "rew": 42.8652, "rew_std": 2.2385, "Agent": "SAC"}, {"env_step": 1245000, "rew": 43.5858, "rew_std": 0.4343, "Agent": "SAC"}, {"env_step": 1250000, "rew": 43.7967, "rew_std": 1.4092, "Agent": "SAC"}, {"env_step": 0, "rew": 1.0258, "rew_std": 3.8982, "Agent": "TRPO"}, {"env_step": 30720, "rew": 4.5318, "rew_std": 9.1322, "Agent": "TRPO"}, {"env_step": 61440, "rew": 17.1783, "rew_std": 8.1443, "Agent": "TRPO"}, {"env_step": 92160, "rew": 11.1364, "rew_std": 12.8551, "Agent": "TRPO"}, {"env_step": 122880, "rew": 15.7876, "rew_std": 10.9049, "Agent": "TRPO"}, {"env_step": 153600, "rew": 21.7352, "rew_std": 7.681, "Agent": "TRPO"}, {"env_step": 184320, "rew": 23.1981, "rew_std": 9.3278, "Agent": "TRPO"}, {"env_step": 215040, "rew": 21.9929, "rew_std": 8.907, "Agent": "TRPO"}, {"env_step": 245760, "rew": 21.8011, "rew_std": 8.5701, "Agent": "TRPO"}, {"env_step": 276480, "rew": 16.2216, "rew_std": 15.0817, "Agent": "TRPO"}, {"env_step": 307200, "rew": 23.3714, "rew_std": 10.452, "Agent": "TRPO"}, {"env_step": 337920, "rew": 22.3619, "rew_std": 11.7553, "Agent": "TRPO"}, {"env_step": 368640, "rew": 17.2247, "rew_std": 10.5776, "Agent": "TRPO"}, {"env_step": 399360, "rew": 15.3447, "rew_std": 14.1523, "Agent": "TRPO"}, {"env_step": 430080, "rew": 21.4185, "rew_std": 11.8105, "Agent": "TRPO"}, {"env_step": 460800, "rew": 25.6353, "rew_std": 8.0985, "Agent": "TRPO"}, {"env_step": 491520, "rew": 23.912, "rew_std": 11.0104, "Agent": "TRPO"}, {"env_step": 522240, "rew": 23.7326, "rew_std": 13.0333, "Agent": "TRPO"}, {"env_step": 552960, "rew": 20.2099, "rew_std": 11.8485, "Agent": "TRPO"}, {"env_step": 583680, "rew": 26.7197, "rew_std": 13.5298, "Agent": "TRPO"}, {"env_step": 614400, "rew": 26.1615, "rew_std": 13.1838, "Agent": "TRPO"}, {"env_step": 645120, "rew": 26.7897, "rew_std": 12.4442, "Agent": "TRPO"}, {"env_step": 675840, "rew": 25.7339, "rew_std": 14.2278, "Agent": "TRPO"}, {"env_step": 706560, "rew": 25.3773, "rew_std": 13.8077, "Agent": "TRPO"}, {"env_step": 737280, "rew": 25.283, "rew_std": 13.5207, "Agent": "TRPO"}, {"env_step": 768000, "rew": 23.0409, "rew_std": 11.0208, "Agent": "TRPO"}, {"env_step": 798720, "rew": 29.934, "rew_std": 5.984, "Agent": "TRPO"}, {"env_step": 829440, "rew": 30.0473, "rew_std": 12.1315, "Agent": "TRPO"}, {"env_step": 860160, "rew": 30.4816, "rew_std": 6.7929, "Agent": "TRPO"}, {"env_step": 890880, "rew": 31.0399, "rew_std": 7.8191, "Agent": "TRPO"}, {"env_step": 921600, "rew": 28.5465, "rew_std": 9.465, "Agent": "TRPO"}, {"env_step": 952320, "rew": 40.8794, "rew_std": 19.6036, "Agent": "TRPO"}, {"env_step": 983040, "rew": 35.2544, "rew_std": 9.8548, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 35.8913, "rew_std": 15.153, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 36.3142, "rew_std": 9.3228, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 40.3545, "rew_std": 8.1899, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 37.6326, "rew_std": 10.5305, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 35.7299, "rew_std": 9.4198, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 39.7711, "rew_std": 10.2011, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 40.3729, "rew_std": 11.5894, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 38.7288, "rew_std": 14.6177, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 40.6935, "rew_std": 11.953, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 40.923, "rew_std": 11.6621, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 40.5632, "rew_std": 12.2226, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 41.5803, "rew_std": 12.3069, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 42.841, "rew_std": 13.1908, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 40.7195, "rew_std": 14.052, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 40.825, "rew_std": 14.2874, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 41.2722, "rew_std": 16.3205, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 41.3137, "rew_std": 14.5586, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 39.9332, "rew_std": 18.1791, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 41.4336, "rew_std": 14.8714, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 40.6074, "rew_std": 14.2556, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 40.3314, "rew_std": 14.6359, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 40.6411, "rew_std": 13.7657, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 40.063, "rew_std": 13.1091, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 39.2744, "rew_std": 14.5692, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 43.0201, "rew_std": 13.7228, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 43.1458, "rew_std": 11.4684, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 39.9404, "rew_std": 15.0808, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 43.333, "rew_std": 13.852, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 42.9801, "rew_std": 12.7705, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 44.6854, "rew_std": 12.6985, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 42.9459, "rew_std": 12.4341, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 43.0257, "rew_std": 12.266, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 42.3165, "rew_std": 12.166, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 42.8874, "rew_std": 13.8315, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 43.5802, "rew_std": 11.809, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 43.3643, "rew_std": 13.5887, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 42.7233, "rew_std": 13.8014, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 44.399, "rew_std": 12.0618, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 42.5993, "rew_std": 12.0986, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 44.0034, "rew_std": 11.469, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 43.0665, "rew_std": 12.3106, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 42.4313, "rew_std": 12.7302, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 44.0498, "rew_std": 11.5515, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 43.1084, "rew_std": 12.4292, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 42.4667, "rew_std": 13.2913, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 43.4829, "rew_std": 12.1768, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 44.5822, "rew_std": 11.1271, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 44.8384, "rew_std": 11.115, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 45.1578, "rew_std": 11.1132, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 44.4818, "rew_std": 11.4255, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 43.9457, "rew_std": 11.4149, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 46.2701, "rew_std": 10.7292, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 46.7152, "rew_std": 10.955, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 45.143, "rew_std": 11.1811, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 45.6513, "rew_std": 11.4575, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 45.9318, "rew_std": 10.8268, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 45.412, "rew_std": 11.4522, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 45.9734, "rew_std": 11.2923, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 45.7451, "rew_std": 11.7504, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 45.9365, "rew_std": 10.9782, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 45.5058, "rew_std": 11.6701, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 46.4317, "rew_std": 11.8878, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 45.7954, "rew_std": 10.7242, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 46.4324, "rew_std": 10.8928, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 46.8533, "rew_std": 11.1076, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 47.1498, "rew_std": 10.6239, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 46.2512, "rew_std": 11.4401, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 45.8183, "rew_std": 11.201, "Agent": "TRPO"}, {"env_step": 0, "rew": 1.0013, "rew_std": 3.8528, "Agent": "A2C"}, {"env_step": 30000, "rew": 29.7993, "rew_std": 3.9754, "Agent": "A2C"}, {"env_step": 60000, "rew": 30.3959, "rew_std": 3.2532, "Agent": "A2C"}, {"env_step": 90000, "rew": 28.3456, "rew_std": 4.0923, "Agent": "A2C"}, {"env_step": 120000, "rew": 27.5501, "rew_std": 6.0253, "Agent": "A2C"}, {"env_step": 150000, "rew": 28.0867, "rew_std": 4.9332, "Agent": "A2C"}, {"env_step": 180000, "rew": 28.6474, "rew_std": 4.651, "Agent": "A2C"}, {"env_step": 210000, "rew": 30.9932, "rew_std": 4.2765, "Agent": "A2C"}, {"env_step": 240000, "rew": 28.4719, "rew_std": 5.4846, "Agent": "A2C"}, {"env_step": 270000, "rew": 31.8838, "rew_std": 5.2627, "Agent": "A2C"}, {"env_step": 300000, "rew": 30.2396, "rew_std": 5.2384, "Agent": "A2C"}, {"env_step": 330000, "rew": 30.2113, "rew_std": 4.9179, "Agent": "A2C"}, {"env_step": 360000, "rew": 30.1494, "rew_std": 4.1007, "Agent": "A2C"}, {"env_step": 390000, "rew": 30.4588, "rew_std": 5.2267, "Agent": "A2C"}, {"env_step": 420000, "rew": 26.5, "rew_std": 11.502, "Agent": "A2C"}, {"env_step": 450000, "rew": 25.217, "rew_std": 13.1053, "Agent": "A2C"}, {"env_step": 480000, "rew": 29.6318, "rew_std": 3.5898, "Agent": "A2C"}, {"env_step": 510000, "rew": 31.3575, "rew_std": 3.5037, "Agent": "A2C"}, {"env_step": 540000, "rew": 29.2128, "rew_std": 7.123, "Agent": "A2C"}, {"env_step": 570000, "rew": 27.5395, "rew_std": 13.1816, "Agent": "A2C"}, {"env_step": 600000, "rew": 32.1327, "rew_std": 4.1747, "Agent": "A2C"}, {"env_step": 630000, "rew": 33.766, "rew_std": 3.2507, "Agent": "A2C"}, {"env_step": 660000, "rew": 33.3526, "rew_std": 2.6203, "Agent": "A2C"}, {"env_step": 690000, "rew": 34.0419, "rew_std": 3.0868, "Agent": "A2C"}, {"env_step": 720000, "rew": 32.2121, "rew_std": 4.1134, "Agent": "A2C"}, {"env_step": 750000, "rew": 34.1606, "rew_std": 3.6611, "Agent": "A2C"}, {"env_step": 780000, "rew": 34.1478, "rew_std": 4.0238, "Agent": "A2C"}, {"env_step": 810000, "rew": 35.4491, "rew_std": 2.8849, "Agent": "A2C"}, {"env_step": 840000, "rew": 34.4226, "rew_std": 3.5149, "Agent": "A2C"}, {"env_step": 870000, "rew": 35.3543, "rew_std": 4.166, "Agent": "A2C"}, {"env_step": 900000, "rew": 36.1545, "rew_std": 2.3202, "Agent": "A2C"}, {"env_step": 930000, "rew": 36.5783, "rew_std": 2.0716, "Agent": "A2C"}, {"env_step": 960000, "rew": 36.4439, "rew_std": 1.685, "Agent": "A2C"}, {"env_step": 990000, "rew": 37.6793, "rew_std": 2.2051, "Agent": "A2C"}, {"env_step": 1020000, "rew": 37.2984, "rew_std": 1.7872, "Agent": "A2C"}, {"env_step": 1050000, "rew": 38.0321, "rew_std": 1.8195, "Agent": "A2C"}, {"env_step": 1080000, "rew": 37.8466, "rew_std": 1.4684, "Agent": "A2C"}, {"env_step": 1110000, "rew": 37.8256, "rew_std": 1.1826, "Agent": "A2C"}, {"env_step": 1140000, "rew": 39.0075, "rew_std": 1.0609, "Agent": "A2C"}, {"env_step": 1170000, "rew": 39.2442, "rew_std": 1.3947, "Agent": "A2C"}, {"env_step": 1200000, "rew": 39.453, "rew_std": 2.2734, "Agent": "A2C"}, {"env_step": 1230000, "rew": 35.9649, "rew_std": 6.3833, "Agent": "A2C"}, {"env_step": 1260000, "rew": 31.5987, "rew_std": 12.7203, "Agent": "A2C"}, {"env_step": 1290000, "rew": 32.8363, "rew_std": 9.2033, "Agent": "A2C"}, {"env_step": 1320000, "rew": 37.9098, "rew_std": 1.205, "Agent": "A2C"}, {"env_step": 1350000, "rew": 38.5353, "rew_std": 2.1037, "Agent": "A2C"}, {"env_step": 1380000, "rew": 38.1807, "rew_std": 1.2005, "Agent": "A2C"}, {"env_step": 1410000, "rew": 38.4203, "rew_std": 1.5115, "Agent": "A2C"}, {"env_step": 1440000, "rew": 39.6521, "rew_std": 1.7111, "Agent": "A2C"}, {"env_step": 1470000, "rew": 40.1757, "rew_std": 1.7654, "Agent": "A2C"}, {"env_step": 1500000, "rew": 38.9241, "rew_std": 4.0098, "Agent": "A2C"}, {"env_step": 1530000, "rew": 38.8691, "rew_std": 1.0207, "Agent": "A2C"}, {"env_step": 1560000, "rew": 37.6942, "rew_std": 1.4168, "Agent": "A2C"}, {"env_step": 1590000, "rew": 37.2206, "rew_std": 2.0337, "Agent": "A2C"}, {"env_step": 1620000, "rew": 37.5777, "rew_std": 1.6754, "Agent": "A2C"}, {"env_step": 1650000, "rew": 39.0639, "rew_std": 1.3262, "Agent": "A2C"}, {"env_step": 1680000, "rew": 37.425, "rew_std": 1.987, "Agent": "A2C"}, {"env_step": 1710000, "rew": 39.4677, "rew_std": 1.3648, "Agent": "A2C"}, {"env_step": 1740000, "rew": 39.3563, "rew_std": 1.0205, "Agent": "A2C"}, {"env_step": 1770000, "rew": 38.059, "rew_std": 1.6514, "Agent": "A2C"}, {"env_step": 1800000, "rew": 38.1195, "rew_std": 1.4545, "Agent": "A2C"}, {"env_step": 1830000, "rew": 38.2468, "rew_std": 1.1224, "Agent": "A2C"}, {"env_step": 1860000, "rew": 38.7659, "rew_std": 0.9623, "Agent": "A2C"}, {"env_step": 1890000, "rew": 38.4909, "rew_std": 2.7385, "Agent": "A2C"}, {"env_step": 1920000, "rew": 39.4811, "rew_std": 1.4997, "Agent": "A2C"}, {"env_step": 1950000, "rew": 38.6882, "rew_std": 1.5165, "Agent": "A2C"}, {"env_step": 1980000, "rew": 38.6259, "rew_std": 1.3783, "Agent": "A2C"}, {"env_step": 2010000, "rew": 38.206, "rew_std": 1.0947, "Agent": "A2C"}, {"env_step": 2040000, "rew": 38.7419, "rew_std": 1.2666, "Agent": "A2C"}, {"env_step": 2070000, "rew": 38.8753, "rew_std": 1.0511, "Agent": "A2C"}, {"env_step": 2100000, "rew": 39.2905, "rew_std": 0.8688, "Agent": "A2C"}, {"env_step": 2130000, "rew": 38.5898, "rew_std": 1.1922, "Agent": "A2C"}, {"env_step": 2160000, "rew": 38.8536, "rew_std": 1.4781, "Agent": "A2C"}, {"env_step": 2190000, "rew": 38.6747, "rew_std": 1.4462, "Agent": "A2C"}, {"env_step": 2220000, "rew": 39.1438, "rew_std": 1.8135, "Agent": "A2C"}, {"env_step": 2250000, "rew": 38.1845, "rew_std": 1.669, "Agent": "A2C"}, {"env_step": 2280000, "rew": 38.0937, "rew_std": 1.3581, "Agent": "A2C"}, {"env_step": 2310000, "rew": 39.145, "rew_std": 1.1566, "Agent": "A2C"}, {"env_step": 2340000, "rew": 38.9103, "rew_std": 1.674, "Agent": "A2C"}, {"env_step": 2370000, "rew": 39.5428, "rew_std": 1.1176, "Agent": "A2C"}, {"env_step": 2400000, "rew": 39.1527, "rew_std": 1.1771, "Agent": "A2C"}, {"env_step": 2430000, "rew": 39.2441, "rew_std": 1.3234, "Agent": "A2C"}, {"env_step": 2460000, "rew": 38.2308, "rew_std": 1.3427, "Agent": "A2C"}, {"env_step": 2490000, "rew": 38.306, "rew_std": 1.3113, "Agent": "A2C"}, {"env_step": 2520000, "rew": 38.9159, "rew_std": 1.0674, "Agent": "A2C"}, {"env_step": 2550000, "rew": 38.9894, "rew_std": 1.1316, "Agent": "A2C"}, {"env_step": 2580000, "rew": 39.2214, "rew_std": 1.4829, "Agent": "A2C"}, {"env_step": 2610000, "rew": 39.6471, "rew_std": 1.1784, "Agent": "A2C"}, {"env_step": 2640000, "rew": 39.0951, "rew_std": 1.156, "Agent": "A2C"}, {"env_step": 2670000, "rew": 38.9363, "rew_std": 1.1787, "Agent": "A2C"}, {"env_step": 2700000, "rew": 38.4542, "rew_std": 1.7708, "Agent": "A2C"}, {"env_step": 2730000, "rew": 38.2105, "rew_std": 1.439, "Agent": "A2C"}, {"env_step": 2760000, "rew": 38.8404, "rew_std": 1.7091, "Agent": "A2C"}, {"env_step": 2790000, "rew": 38.7218, "rew_std": 1.588, "Agent": "A2C"}, {"env_step": 2820000, "rew": 39.4069, "rew_std": 1.5121, "Agent": "A2C"}, {"env_step": 2850000, "rew": 39.1226, "rew_std": 1.2302, "Agent": "A2C"}, {"env_step": 2880000, "rew": 38.7814, "rew_std": 1.1653, "Agent": "A2C"}, {"env_step": 2910000, "rew": 38.7925, "rew_std": 1.3412, "Agent": "A2C"}, {"env_step": 2940000, "rew": 38.8147, "rew_std": 1.3375, "Agent": "A2C"}, {"env_step": 2970000, "rew": 38.8382, "rew_std": 1.1257, "Agent": "A2C"}, {"env_step": 3000000, "rew": 38.6791, "rew_std": 1.0833, "Agent": "A2C"}, {"env_step": 0, "rew": 0.7291, "rew_std": 3.4704, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 16.1156, "rew_std": 17.5055, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 26.0472, "rew_std": 10.5541, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 32.057, "rew_std": 7.0379, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 34.3079, "rew_std": 5.4228, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 40.073, "rew_std": 11.6586, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 41.6829, "rew_std": 20.9164, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 46.8218, "rew_std": 22.7845, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 48.4253, "rew_std": 19.708, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 52.8069, "rew_std": 22.96, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 58.1953, "rew_std": 25.0383, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 62.8163, "rew_std": 25.632, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 68.4201, "rew_std": 25.3657, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 76.1497, "rew_std": 24.3487, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 82.0617, "rew_std": 25.6338, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 86.0658, "rew_std": 28.1079, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 87.3938, "rew_std": 28.7587, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 90.0831, "rew_std": 28.2023, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 93.3634, "rew_std": 28.4218, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 94.7138, "rew_std": 29.4864, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 96.0964, "rew_std": 30.3279, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 97.1682, "rew_std": 30.3667, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 95.069, "rew_std": 29.1647, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 96.9417, "rew_std": 29.005, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 97.5663, "rew_std": 31.0027, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 97.921, "rew_std": 30.6128, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 101.438, "rew_std": 32.1726, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 101.6066, "rew_std": 32.1387, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 100.5394, "rew_std": 31.9, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 100.8823, "rew_std": 32.3085, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 100.4713, "rew_std": 31.791, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 99.95, "rew_std": 31.6506, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 101.1176, "rew_std": 32.1142, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 100.48, "rew_std": 33.1721, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 102.9029, "rew_std": 32.909, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 103.2164, "rew_std": 33.2227, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 103.4409, "rew_std": 33.6099, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 103.0006, "rew_std": 33.8036, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 102.7968, "rew_std": 32.8109, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 101.9202, "rew_std": 32.0937, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 102.3284, "rew_std": 32.5445, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 103.1331, "rew_std": 33.9416, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 104.6618, "rew_std": 33.6632, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 105.7183, "rew_std": 34.5343, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 104.0436, "rew_std": 33.41, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 102.5194, "rew_std": 32.2822, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 103.6585, "rew_std": 32.9268, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 104.485, "rew_std": 34.2728, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 103.7928, "rew_std": 32.7273, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 105.1082, "rew_std": 32.9405, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 103.7885, "rew_std": 32.8596, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 105.9567, "rew_std": 34.0607, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 105.2026, "rew_std": 33.253, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 106.5636, "rew_std": 35.2588, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 106.2235, "rew_std": 34.5774, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 105.8435, "rew_std": 35.7613, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 105.058, "rew_std": 34.081, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 105.2318, "rew_std": 33.8789, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 105.4914, "rew_std": 35.0429, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 106.2321, "rew_std": 34.875, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 105.6087, "rew_std": 34.5931, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 106.7634, "rew_std": 35.2935, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 105.4142, "rew_std": 34.9183, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 105.7646, "rew_std": 35.2139, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 105.9258, "rew_std": 34.2383, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 106.7368, "rew_std": 35.0853, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 107.4783, "rew_std": 34.5306, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 108.0829, "rew_std": 35.7002, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 107.4322, "rew_std": 35.271, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 108.7529, "rew_std": 36.2032, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 107.3181, "rew_std": 35.4295, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 108.0066, "rew_std": 35.979, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 107.8602, "rew_std": 35.3109, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 107.7957, "rew_std": 34.9063, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 108.5944, "rew_std": 34.2298, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 109.6587, "rew_std": 36.0963, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 109.9554, "rew_std": 36.1506, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 109.1644, "rew_std": 36.8921, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 108.5692, "rew_std": 35.7915, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 108.4334, "rew_std": 37.4289, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 109.8947, "rew_std": 36.685, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 110.4385, "rew_std": 36.6434, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 109.9774, "rew_std": 35.8877, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 108.7004, "rew_std": 35.7559, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 110.5201, "rew_std": 36.2002, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 108.8395, "rew_std": 37.2365, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 108.1341, "rew_std": 35.9659, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 109.912, "rew_std": 36.9513, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 110.308, "rew_std": 36.4508, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 110.8231, "rew_std": 36.7277, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 109.9004, "rew_std": 36.6838, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 110.1751, "rew_std": 37.8331, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 110.3556, "rew_std": 36.5481, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 109.2395, "rew_std": 36.4852, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 111.5482, "rew_std": 37.9205, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 110.7781, "rew_std": 37.3948, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 111.6956, "rew_std": 37.6913, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 112.2976, "rew_std": 37.6584, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 111.8278, "rew_std": 37.8407, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 110.8731, "rew_std": 36.8636, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 111.5076, "rew_std": 36.1059, "Agent": "ACKTR"}, {"env_step": 0, "rew": -7.7439, "rew_std": 16.8878, "Agent": "DDPG"}, {"env_step": 5000, "rew": 27.111, "rew_std": 10.2362, "Agent": "DDPG"}, {"env_step": 10000, "rew": 28.6777, "rew_std": 26.9079, "Agent": "DDPG"}, {"env_step": 15000, "rew": 29.5172, "rew_std": 20.6009, "Agent": "DDPG"}, {"env_step": 20000, "rew": 31.1824, "rew_std": 12.3387, "Agent": "DDPG"}, {"env_step": 25000, "rew": 35.9658, "rew_std": 11.5662, "Agent": "DDPG"}, {"env_step": 30000, "rew": 32.4928, "rew_std": 11.4795, "Agent": "DDPG"}, {"env_step": 35000, "rew": 36.4445, "rew_std": 13.4968, "Agent": "DDPG"}, {"env_step": 40000, "rew": 29.8878, "rew_std": 17.7985, "Agent": "DDPG"}, {"env_step": 45000, "rew": 41.0883, "rew_std": 10.6527, "Agent": "DDPG"}, {"env_step": 50000, "rew": 39.2044, "rew_std": 5.6556, "Agent": "DDPG"}, {"env_step": 55000, "rew": 46.6439, "rew_std": 8.09, "Agent": "DDPG"}, {"env_step": 60000, "rew": 41.5579, "rew_std": 10.6506, "Agent": "DDPG"}, {"env_step": 65000, "rew": 44.8723, "rew_std": 10.5025, "Agent": "DDPG"}, {"env_step": 70000, "rew": 45.1928, "rew_std": 10.4595, "Agent": "DDPG"}, {"env_step": 75000, "rew": 41.8443, "rew_std": 10.1912, "Agent": "DDPG"}, {"env_step": 80000, "rew": 49.2066, "rew_std": 11.219, "Agent": "DDPG"}, {"env_step": 85000, "rew": 47.8705, "rew_std": 6.2717, "Agent": "DDPG"}, {"env_step": 90000, "rew": 51.3617, "rew_std": 6.4001, "Agent": "DDPG"}, {"env_step": 95000, "rew": 53.8505, "rew_std": 19.8274, "Agent": "DDPG"}, {"env_step": 100000, "rew": 54.9865, "rew_std": 14.7739, "Agent": "DDPG"}, {"env_step": 105000, "rew": 51.164, "rew_std": 5.3692, "Agent": "DDPG"}, {"env_step": 110000, "rew": 53.5985, "rew_std": 16.8755, "Agent": "DDPG"}, {"env_step": 115000, "rew": 53.6093, "rew_std": 16.448, "Agent": "DDPG"}, {"env_step": 120000, "rew": 54.4763, "rew_std": 6.8215, "Agent": "DDPG"}, {"env_step": 125000, "rew": 59.7466, "rew_std": 8.9492, "Agent": "DDPG"}, {"env_step": 130000, "rew": 58.1804, "rew_std": 10.4326, "Agent": "DDPG"}, {"env_step": 135000, "rew": 60.8608, "rew_std": 17.5299, "Agent": "DDPG"}, {"env_step": 140000, "rew": 61.3081, "rew_std": 19.6055, "Agent": "DDPG"}, {"env_step": 145000, "rew": 71.2575, "rew_std": 28.7301, "Agent": "DDPG"}, {"env_step": 150000, "rew": 64.1452, "rew_std": 22.4875, "Agent": "DDPG"}, {"env_step": 155000, "rew": 72.976, "rew_std": 23.0466, "Agent": "DDPG"}, {"env_step": 160000, "rew": 77.025, "rew_std": 28.1836, "Agent": "DDPG"}, {"env_step": 165000, "rew": 79.2977, "rew_std": 27.8582, "Agent": "DDPG"}, {"env_step": 170000, "rew": 77.7769, "rew_std": 27.7826, "Agent": "DDPG"}, {"env_step": 175000, "rew": 79.8337, "rew_std": 32.1006, "Agent": "DDPG"}, {"env_step": 180000, "rew": 86.3861, "rew_std": 29.9729, "Agent": "DDPG"}, {"env_step": 185000, "rew": 83.9423, "rew_std": 32.7325, "Agent": "DDPG"}, {"env_step": 190000, "rew": 87.4571, "rew_std": 29.596, "Agent": "DDPG"}, {"env_step": 195000, "rew": 88.5118, "rew_std": 34.1182, "Agent": "DDPG"}, {"env_step": 200000, "rew": 96.4085, "rew_std": 30.9893, "Agent": "DDPG"}, {"env_step": 205000, "rew": 90.2024, "rew_std": 27.9598, "Agent": "DDPG"}, {"env_step": 210000, "rew": 100.2493, "rew_std": 27.3851, "Agent": "DDPG"}, {"env_step": 215000, "rew": 100.3753, "rew_std": 29.3593, "Agent": "DDPG"}, {"env_step": 220000, "rew": 104.0079, "rew_std": 25.5209, "Agent": "DDPG"}, {"env_step": 225000, "rew": 104.117, "rew_std": 24.1255, "Agent": "DDPG"}, {"env_step": 230000, "rew": 101.1801, "rew_std": 27.2732, "Agent": "DDPG"}, {"env_step": 235000, "rew": 113.4582, "rew_std": 23.629, "Agent": "DDPG"}, {"env_step": 240000, "rew": 113.4486, "rew_std": 23.8049, "Agent": "DDPG"}, {"env_step": 245000, "rew": 111.7019, "rew_std": 25.4914, "Agent": "DDPG"}, {"env_step": 250000, "rew": 115.0514, "rew_std": 24.8545, "Agent": "DDPG"}, {"env_step": 255000, "rew": 115.979, "rew_std": 24.0976, "Agent": "DDPG"}, {"env_step": 260000, "rew": 122.0173, "rew_std": 24.6718, "Agent": "DDPG"}, {"env_step": 265000, "rew": 121.0905, "rew_std": 23.2614, "Agent": "DDPG"}, {"env_step": 270000, "rew": 118.8829, "rew_std": 28.7329, "Agent": "DDPG"}, {"env_step": 275000, "rew": 121.1204, "rew_std": 22.4617, "Agent": "DDPG"}, {"env_step": 280000, "rew": 120.106, "rew_std": 22.087, "Agent": "DDPG"}, {"env_step": 285000, "rew": 122.4843, "rew_std": 25.8522, "Agent": "DDPG"}, {"env_step": 290000, "rew": 126.2871, "rew_std": 19.0177, "Agent": "DDPG"}, {"env_step": 295000, "rew": 121.7824, "rew_std": 19.3339, "Agent": "DDPG"}, {"env_step": 300000, "rew": 124.2313, "rew_std": 22.2559, "Agent": "DDPG"}, {"env_step": 305000, "rew": 127.2795, "rew_std": 18.6246, "Agent": "DDPG"}, {"env_step": 310000, "rew": 126.778, "rew_std": 19.8358, "Agent": "DDPG"}, {"env_step": 315000, "rew": 128.4156, "rew_std": 21.5798, "Agent": "DDPG"}, {"env_step": 320000, "rew": 126.0861, "rew_std": 20.0165, "Agent": "DDPG"}, {"env_step": 325000, "rew": 129.3534, "rew_std": 19.0216, "Agent": "DDPG"}, {"env_step": 330000, "rew": 130.358, "rew_std": 17.8578, "Agent": "DDPG"}, {"env_step": 335000, "rew": 132.1706, "rew_std": 13.9828, "Agent": "DDPG"}, {"env_step": 340000, "rew": 129.9149, "rew_std": 12.1114, "Agent": "DDPG"}, {"env_step": 345000, "rew": 131.798, "rew_std": 15.8348, "Agent": "DDPG"}, {"env_step": 350000, "rew": 131.8573, "rew_std": 13.4496, "Agent": "DDPG"}, {"env_step": 355000, "rew": 130.0461, "rew_std": 11.5573, "Agent": "DDPG"}, {"env_step": 360000, "rew": 129.0096, "rew_std": 12.2683, "Agent": "DDPG"}, {"env_step": 365000, "rew": 129.1626, "rew_std": 9.9854, "Agent": "DDPG"}, {"env_step": 370000, "rew": 128.7662, "rew_std": 9.881, "Agent": "DDPG"}, {"env_step": 375000, "rew": 130.6815, "rew_std": 9.6643, "Agent": "DDPG"}, {"env_step": 380000, "rew": 132.8223, "rew_std": 10.335, "Agent": "DDPG"}, {"env_step": 385000, "rew": 133.3924, "rew_std": 13.4702, "Agent": "DDPG"}, {"env_step": 390000, "rew": 133.1555, "rew_std": 11.541, "Agent": "DDPG"}, {"env_step": 395000, "rew": 131.1679, "rew_std": 8.1387, "Agent": "DDPG"}, {"env_step": 400000, "rew": 129.9687, "rew_std": 15.068, "Agent": "DDPG"}, {"env_step": 405000, "rew": 134.1776, "rew_std": 10.885, "Agent": "DDPG"}, {"env_step": 410000, "rew": 136.1757, "rew_std": 9.1146, "Agent": "DDPG"}, {"env_step": 415000, "rew": 133.9262, "rew_std": 12.703, "Agent": "DDPG"}, {"env_step": 420000, "rew": 136.7213, "rew_std": 11.2332, "Agent": "DDPG"}, {"env_step": 425000, "rew": 135.8019, "rew_std": 12.0867, "Agent": "DDPG"}, {"env_step": 430000, "rew": 137.1716, "rew_std": 11.1026, "Agent": "DDPG"}, {"env_step": 435000, "rew": 137.9368, "rew_std": 10.9157, "Agent": "DDPG"}, {"env_step": 440000, "rew": 135.5737, "rew_std": 12.0013, "Agent": "DDPG"}, {"env_step": 445000, "rew": 136.3091, "rew_std": 12.8528, "Agent": "DDPG"}, {"env_step": 450000, "rew": 132.9403, "rew_std": 13.7779, "Agent": "DDPG"}, {"env_step": 455000, "rew": 137.4564, "rew_std": 7.8761, "Agent": "DDPG"}, {"env_step": 460000, "rew": 138.432, "rew_std": 7.0544, "Agent": "DDPG"}, {"env_step": 465000, "rew": 133.4846, "rew_std": 8.8001, "Agent": "DDPG"}, {"env_step": 470000, "rew": 133.5229, "rew_std": 10.4753, "Agent": "DDPG"}, {"env_step": 475000, "rew": 135.3913, "rew_std": 9.919, "Agent": "DDPG"}, {"env_step": 480000, "rew": 132.1134, "rew_std": 26.522, "Agent": "DDPG"}, {"env_step": 485000, "rew": 138.0401, "rew_std": 13.214, "Agent": "DDPG"}, {"env_step": 490000, "rew": 137.6227, "rew_std": 9.5667, "Agent": "DDPG"}, {"env_step": 495000, "rew": 132.7349, "rew_std": 15.8578, "Agent": "DDPG"}, {"env_step": 500000, "rew": 136.57, "rew_std": 6.4353, "Agent": "DDPG"}, {"env_step": 505000, "rew": 139.3636, "rew_std": 9.0841, "Agent": "DDPG"}, {"env_step": 510000, "rew": 136.9163, "rew_std": 7.471, "Agent": "DDPG"}, {"env_step": 515000, "rew": 136.207, "rew_std": 9.6977, "Agent": "DDPG"}, {"env_step": 520000, "rew": 138.2055, "rew_std": 6.4213, "Agent": "DDPG"}, {"env_step": 525000, "rew": 136.4244, "rew_std": 5.5003, "Agent": "DDPG"}, {"env_step": 530000, "rew": 136.5625, "rew_std": 4.0473, "Agent": "DDPG"}, {"env_step": 535000, "rew": 138.2565, "rew_std": 5.4598, "Agent": "DDPG"}, {"env_step": 540000, "rew": 137.4138, "rew_std": 7.1241, "Agent": "DDPG"}, {"env_step": 545000, "rew": 140.4092, "rew_std": 10.8827, "Agent": "DDPG"}, {"env_step": 550000, "rew": 138.3283, "rew_std": 8.6329, "Agent": "DDPG"}, {"env_step": 555000, "rew": 136.1647, "rew_std": 7.8454, "Agent": "DDPG"}, {"env_step": 560000, "rew": 140.6664, "rew_std": 6.8785, "Agent": "DDPG"}, {"env_step": 565000, "rew": 139.045, "rew_std": 9.4246, "Agent": "DDPG"}, {"env_step": 570000, "rew": 135.7369, "rew_std": 9.8926, "Agent": "DDPG"}, {"env_step": 575000, "rew": 136.6039, "rew_std": 6.9162, "Agent": "DDPG"}, {"env_step": 580000, "rew": 138.3082, "rew_std": 5.7867, "Agent": "DDPG"}, {"env_step": 585000, "rew": 139.113, "rew_std": 7.4853, "Agent": "DDPG"}, {"env_step": 590000, "rew": 139.5336, "rew_std": 8.0436, "Agent": "DDPG"}, {"env_step": 595000, "rew": 135.7219, "rew_std": 9.0493, "Agent": "DDPG"}, {"env_step": 600000, "rew": 139.0518, "rew_std": 5.966, "Agent": "DDPG"}, {"env_step": 605000, "rew": 134.7683, "rew_std": 10.3015, "Agent": "DDPG"}, {"env_step": 610000, "rew": 138.8106, "rew_std": 8.7777, "Agent": "DDPG"}, {"env_step": 615000, "rew": 137.989, "rew_std": 8.3029, "Agent": "DDPG"}, {"env_step": 620000, "rew": 135.4547, "rew_std": 11.4179, "Agent": "DDPG"}, {"env_step": 625000, "rew": 138.5979, "rew_std": 13.4474, "Agent": "DDPG"}, {"env_step": 630000, "rew": 137.1638, "rew_std": 4.0057, "Agent": "DDPG"}, {"env_step": 635000, "rew": 138.6027, "rew_std": 6.9118, "Agent": "DDPG"}, {"env_step": 640000, "rew": 138.4561, "rew_std": 5.3458, "Agent": "DDPG"}, {"env_step": 645000, "rew": 137.6744, "rew_std": 9.7438, "Agent": "DDPG"}, {"env_step": 650000, "rew": 140.8803, "rew_std": 10.5245, "Agent": "DDPG"}, {"env_step": 655000, "rew": 137.6448, "rew_std": 10.9617, "Agent": "DDPG"}, {"env_step": 660000, "rew": 140.081, "rew_std": 6.8093, "Agent": "DDPG"}, {"env_step": 665000, "rew": 140.6238, "rew_std": 6.7335, "Agent": "DDPG"}, {"env_step": 670000, "rew": 137.5476, "rew_std": 5.7097, "Agent": "DDPG"}, {"env_step": 675000, "rew": 140.0157, "rew_std": 3.6635, "Agent": "DDPG"}, {"env_step": 680000, "rew": 139.8821, "rew_std": 6.7079, "Agent": "DDPG"}, {"env_step": 685000, "rew": 139.6744, "rew_std": 4.1447, "Agent": "DDPG"}, {"env_step": 690000, "rew": 140.5739, "rew_std": 3.8759, "Agent": "DDPG"}, {"env_step": 695000, "rew": 140.9771, "rew_std": 5.3847, "Agent": "DDPG"}, {"env_step": 700000, "rew": 141.7002, "rew_std": 4.175, "Agent": "DDPG"}, {"env_step": 705000, "rew": 140.0991, "rew_std": 6.4371, "Agent": "DDPG"}, {"env_step": 710000, "rew": 138.9222, "rew_std": 4.4813, "Agent": "DDPG"}, {"env_step": 715000, "rew": 140.0551, "rew_std": 9.8149, "Agent": "DDPG"}, {"env_step": 720000, "rew": 140.2259, "rew_std": 4.8199, "Agent": "DDPG"}, {"env_step": 725000, "rew": 138.2153, "rew_std": 8.7884, "Agent": "DDPG"}, {"env_step": 730000, "rew": 139.7536, "rew_std": 6.6101, "Agent": "DDPG"}, {"env_step": 735000, "rew": 140.7631, "rew_std": 4.6529, "Agent": "DDPG"}, {"env_step": 740000, "rew": 138.884, "rew_std": 5.6056, "Agent": "DDPG"}, {"env_step": 745000, "rew": 142.3084, "rew_std": 7.3071, "Agent": "DDPG"}, {"env_step": 750000, "rew": 143.9028, "rew_std": 5.4536, "Agent": "DDPG"}, {"env_step": 755000, "rew": 143.2372, "rew_std": 7.275, "Agent": "DDPG"}, {"env_step": 760000, "rew": 140.6356, "rew_std": 4.3539, "Agent": "DDPG"}, {"env_step": 765000, "rew": 137.9779, "rew_std": 6.4228, "Agent": "DDPG"}, {"env_step": 770000, "rew": 139.6024, "rew_std": 4.6246, "Agent": "DDPG"}, {"env_step": 775000, "rew": 139.0619, "rew_std": 7.1484, "Agent": "DDPG"}, {"env_step": 780000, "rew": 138.1545, "rew_std": 11.656, "Agent": "DDPG"}, {"env_step": 785000, "rew": 138.0749, "rew_std": 3.3782, "Agent": "DDPG"}, {"env_step": 790000, "rew": 140.7768, "rew_std": 8.0989, "Agent": "DDPG"}, {"env_step": 795000, "rew": 138.3206, "rew_std": 7.3118, "Agent": "DDPG"}, {"env_step": 800000, "rew": 140.6746, "rew_std": 4.9365, "Agent": "DDPG"}, {"env_step": 805000, "rew": 142.133, "rew_std": 3.0798, "Agent": "DDPG"}, {"env_step": 810000, "rew": 141.6982, "rew_std": 5.9378, "Agent": "DDPG"}, {"env_step": 815000, "rew": 139.0957, "rew_std": 5.2462, "Agent": "DDPG"}, {"env_step": 820000, "rew": 141.4906, "rew_std": 5.9738, "Agent": "DDPG"}, {"env_step": 825000, "rew": 139.0263, "rew_std": 8.3833, "Agent": "DDPG"}, {"env_step": 830000, "rew": 142.5686, "rew_std": 7.9465, "Agent": "DDPG"}, {"env_step": 835000, "rew": 139.6923, "rew_std": 4.4107, "Agent": "DDPG"}, {"env_step": 840000, "rew": 141.8938, "rew_std": 4.7214, "Agent": "DDPG"}, {"env_step": 845000, "rew": 140.2036, "rew_std": 3.3937, "Agent": "DDPG"}, {"env_step": 850000, "rew": 138.7109, "rew_std": 5.7588, "Agent": "DDPG"}, {"env_step": 855000, "rew": 140.7613, "rew_std": 7.2326, "Agent": "DDPG"}, {"env_step": 860000, "rew": 141.6586, "rew_std": 7.8614, "Agent": "DDPG"}, {"env_step": 865000, "rew": 140.926, "rew_std": 4.7326, "Agent": "DDPG"}, {"env_step": 870000, "rew": 139.1153, "rew_std": 6.172, "Agent": "DDPG"}, {"env_step": 875000, "rew": 142.6159, "rew_std": 3.4461, "Agent": "DDPG"}, {"env_step": 880000, "rew": 142.8545, "rew_std": 6.1448, "Agent": "DDPG"}, {"env_step": 885000, "rew": 141.4641, "rew_std": 6.418, "Agent": "DDPG"}, {"env_step": 890000, "rew": 142.9374, "rew_std": 6.063, "Agent": "DDPG"}, {"env_step": 895000, "rew": 142.308, "rew_std": 6.3968, "Agent": "DDPG"}, {"env_step": 900000, "rew": 141.8166, "rew_std": 4.2354, "Agent": "DDPG"}, {"env_step": 905000, "rew": 141.3372, "rew_std": 3.6162, "Agent": "DDPG"}, {"env_step": 910000, "rew": 142.54, "rew_std": 7.2792, "Agent": "DDPG"}, {"env_step": 915000, "rew": 142.4178, "rew_std": 4.8727, "Agent": "DDPG"}, {"env_step": 920000, "rew": 139.7616, "rew_std": 9.0963, "Agent": "DDPG"}, {"env_step": 925000, "rew": 140.8662, "rew_std": 7.1925, "Agent": "DDPG"}, {"env_step": 930000, "rew": 142.59, "rew_std": 7.5659, "Agent": "DDPG"}, {"env_step": 935000, "rew": 141.1232, "rew_std": 5.4951, "Agent": "DDPG"}, {"env_step": 940000, "rew": 140.9761, "rew_std": 4.436, "Agent": "DDPG"}, {"env_step": 945000, "rew": 142.694, "rew_std": 6.0702, "Agent": "DDPG"}, {"env_step": 950000, "rew": 143.414, "rew_std": 7.787, "Agent": "DDPG"}, {"env_step": 955000, "rew": 141.0688, "rew_std": 5.583, "Agent": "DDPG"}, {"env_step": 960000, "rew": 141.8118, "rew_std": 8.1901, "Agent": "DDPG"}, {"env_step": 965000, "rew": 141.6261, "rew_std": 6.3236, "Agent": "DDPG"}, {"env_step": 970000, "rew": 142.2169, "rew_std": 7.4153, "Agent": "DDPG"}, {"env_step": 975000, "rew": 139.8413, "rew_std": 5.3582, "Agent": "DDPG"}, {"env_step": 980000, "rew": 141.311, "rew_std": 7.0072, "Agent": "DDPG"}, {"env_step": 985000, "rew": 140.5871, "rew_std": 5.2723, "Agent": "DDPG"}, {"env_step": 990000, "rew": 144.0535, "rew_std": 6.4924, "Agent": "DDPG"}, {"env_step": 995000, "rew": 141.8434, "rew_std": 4.2558, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 142.2982, "rew_std": 7.6682, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 139.1055, "rew_std": 9.2758, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 141.0416, "rew_std": 5.0772, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 141.6343, "rew_std": 6.0345, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 141.7569, "rew_std": 4.6563, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 141.4089, "rew_std": 4.7605, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 141.2138, "rew_std": 5.7038, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 144.4552, "rew_std": 6.0544, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 140.9662, "rew_std": 3.1099, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 141.1972, "rew_std": 4.5801, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 140.5965, "rew_std": 7.0805, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 140.1733, "rew_std": 4.7662, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 140.4672, "rew_std": 5.3948, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 143.2305, "rew_std": 3.5909, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 143.6553, "rew_std": 5.7578, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 142.2234, "rew_std": 7.5004, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 139.3473, "rew_std": 10.9533, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 140.791, "rew_std": 8.3328, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 141.3331, "rew_std": 9.4282, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 143.6647, "rew_std": 6.6349, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 142.53, "rew_std": 5.9298, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 141.2602, "rew_std": 6.2225, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 140.7595, "rew_std": 4.7542, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 140.6618, "rew_std": 5.5336, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 142.304, "rew_std": 8.0534, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 144.1979, "rew_std": 3.9518, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 141.9399, "rew_std": 5.1798, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 141.6419, "rew_std": 5.5409, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 141.4458, "rew_std": 5.9887, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 140.9982, "rew_std": 5.9734, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 142.6737, "rew_std": 9.5289, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 141.9587, "rew_std": 9.3877, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 137.8503, "rew_std": 14.5437, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 139.3552, "rew_std": 21.4731, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 141.687, "rew_std": 7.7627, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 142.3425, "rew_std": 7.2573, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 138.1963, "rew_std": 16.6084, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 141.6446, "rew_std": 6.3986, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 143.3347, "rew_std": 9.8443, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 140.4516, "rew_std": 6.6021, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 140.1266, "rew_std": 5.6212, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 143.1696, "rew_std": 5.1804, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 143.2144, "rew_std": 4.4858, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 138.569, "rew_std": 12.7858, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 141.7806, "rew_std": 5.4688, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 145.6152, "rew_std": 6.855, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 137.5698, "rew_std": 21.3122, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 143.4506, "rew_std": 7.6401, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 144.9408, "rew_std": 7.5304, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 135.8165, "rew_std": 15.8613, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 140.8486, "rew_std": 11.2777, "Agent": "DDPG"}, {"env_step": 0, "rew": 1.0258, "rew_std": 3.8982, "Agent": "NPG"}, {"env_step": 30720, "rew": 23.7146, "rew_std": 2.9296, "Agent": "NPG"}, {"env_step": 61440, "rew": 21.5204, "rew_std": 5.9224, "Agent": "NPG"}, {"env_step": 92160, "rew": 13.6331, "rew_std": 8.2169, "Agent": "NPG"}, {"env_step": 122880, "rew": 8.7427, "rew_std": 5.8546, "Agent": "NPG"}, {"env_step": 153600, "rew": 6.7801, "rew_std": 9.2345, "Agent": "NPG"}, {"env_step": 184320, "rew": 6.4069, "rew_std": 8.5255, "Agent": "NPG"}, {"env_step": 215040, "rew": 8.4752, "rew_std": 9.2114, "Agent": "NPG"}, {"env_step": 245760, "rew": 9.0475, "rew_std": 7.5991, "Agent": "NPG"}, {"env_step": 276480, "rew": 10.4524, "rew_std": 8.8479, "Agent": "NPG"}, {"env_step": 307200, "rew": 12.7068, "rew_std": 10.8028, "Agent": "NPG"}, {"env_step": 337920, "rew": 13.2985, "rew_std": 9.4718, "Agent": "NPG"}, {"env_step": 368640, "rew": 11.9742, "rew_std": 11.9124, "Agent": "NPG"}, {"env_step": 399360, "rew": 13.6661, "rew_std": 13.2112, "Agent": "NPG"}, {"env_step": 430080, "rew": 14.5806, "rew_std": 12.1707, "Agent": "NPG"}, {"env_step": 460800, "rew": 14.3626, "rew_std": 13.5778, "Agent": "NPG"}, {"env_step": 491520, "rew": 14.3562, "rew_std": 13.6016, "Agent": "NPG"}, {"env_step": 522240, "rew": 11.2651, "rew_std": 13.3187, "Agent": "NPG"}, {"env_step": 552960, "rew": 12.3707, "rew_std": 13.7796, "Agent": "NPG"}, {"env_step": 583680, "rew": 15.743, "rew_std": 14.353, "Agent": "NPG"}, {"env_step": 614400, "rew": 15.141, "rew_std": 13.8719, "Agent": "NPG"}, {"env_step": 645120, "rew": 14.4111, "rew_std": 13.1943, "Agent": "NPG"}, {"env_step": 675840, "rew": 14.9368, "rew_std": 13.5259, "Agent": "NPG"}, {"env_step": 706560, "rew": 18.0811, "rew_std": 11.3189, "Agent": "NPG"}, {"env_step": 737280, "rew": 16.2298, "rew_std": 10.6969, "Agent": "NPG"}, {"env_step": 768000, "rew": 18.2274, "rew_std": 10.5519, "Agent": "NPG"}, {"env_step": 798720, "rew": 21.7817, "rew_std": 10.6298, "Agent": "NPG"}, {"env_step": 829440, "rew": 23.369, "rew_std": 12.2062, "Agent": "NPG"}, {"env_step": 860160, "rew": 23.1065, "rew_std": 10.319, "Agent": "NPG"}, {"env_step": 890880, "rew": 25.8288, "rew_std": 10.2378, "Agent": "NPG"}, {"env_step": 921600, "rew": 25.1132, "rew_std": 9.3431, "Agent": "NPG"}, {"env_step": 952320, "rew": 26.6115, "rew_std": 9.3921, "Agent": "NPG"}, {"env_step": 983040, "rew": 29.4691, "rew_std": 8.764, "Agent": "NPG"}, {"env_step": 1013760, "rew": 33.1585, "rew_std": 7.4503, "Agent": "NPG"}, {"env_step": 1044480, "rew": 32.2367, "rew_std": 8.2393, "Agent": "NPG"}, {"env_step": 1075200, "rew": 33.607, "rew_std": 7.3821, "Agent": "NPG"}, {"env_step": 1105920, "rew": 34.5258, "rew_std": 7.4975, "Agent": "NPG"}, {"env_step": 1136640, "rew": 34.507, "rew_std": 7.0593, "Agent": "NPG"}, {"env_step": 1167360, "rew": 36.6782, "rew_std": 5.9374, "Agent": "NPG"}, {"env_step": 1198080, "rew": 37.6589, "rew_std": 5.3523, "Agent": "NPG"}, {"env_step": 1228800, "rew": 38.4201, "rew_std": 4.1903, "Agent": "NPG"}, {"env_step": 1259520, "rew": 38.9307, "rew_std": 3.4278, "Agent": "NPG"}, {"env_step": 1290240, "rew": 38.7358, "rew_std": 6.0647, "Agent": "NPG"}, {"env_step": 1320960, "rew": 39.9352, "rew_std": 6.1794, "Agent": "NPG"}, {"env_step": 1351680, "rew": 41.2821, "rew_std": 5.224, "Agent": "NPG"}, {"env_step": 1382400, "rew": 40.9985, "rew_std": 6.713, "Agent": "NPG"}, {"env_step": 1413120, "rew": 41.0461, "rew_std": 6.8698, "Agent": "NPG"}, {"env_step": 1443840, "rew": 41.5886, "rew_std": 7.9765, "Agent": "NPG"}, {"env_step": 1474560, "rew": 43.7387, "rew_std": 6.739, "Agent": "NPG"}, {"env_step": 1505280, "rew": 42.9215, "rew_std": 7.2525, "Agent": "NPG"}, {"env_step": 1536000, "rew": 44.6128, "rew_std": 6.518, "Agent": "NPG"}, {"env_step": 1566720, "rew": 44.8393, "rew_std": 6.5894, "Agent": "NPG"}, {"env_step": 1597440, "rew": 43.51, "rew_std": 8.0776, "Agent": "NPG"}, {"env_step": 1628160, "rew": 46.1572, "rew_std": 7.4945, "Agent": "NPG"}, {"env_step": 1658880, "rew": 46.4691, "rew_std": 7.8053, "Agent": "NPG"}, {"env_step": 1689600, "rew": 48.7264, "rew_std": 7.6369, "Agent": "NPG"}, {"env_step": 1720320, "rew": 46.4575, "rew_std": 8.4536, "Agent": "NPG"}, {"env_step": 1751040, "rew": 47.6156, "rew_std": 9.882, "Agent": "NPG"}, {"env_step": 1781760, "rew": 48.4912, "rew_std": 8.2259, "Agent": "NPG"}, {"env_step": 1812480, "rew": 47.8659, "rew_std": 8.615, "Agent": "NPG"}, {"env_step": 1843200, "rew": 49.9064, "rew_std": 7.9016, "Agent": "NPG"}, {"env_step": 1873920, "rew": 49.6945, "rew_std": 8.1372, "Agent": "NPG"}, {"env_step": 1904640, "rew": 49.3308, "rew_std": 8.2622, "Agent": "NPG"}, {"env_step": 1935360, "rew": 51.0023, "rew_std": 7.4984, "Agent": "NPG"}, {"env_step": 1966080, "rew": 50.3444, "rew_std": 8.7265, "Agent": "NPG"}, {"env_step": 1996800, "rew": 51.1145, "rew_std": 8.3731, "Agent": "NPG"}, {"env_step": 2027520, "rew": 50.4669, "rew_std": 8.7647, "Agent": "NPG"}, {"env_step": 2058240, "rew": 50.8541, "rew_std": 8.3398, "Agent": "NPG"}, {"env_step": 2088960, "rew": 52.832, "rew_std": 8.1892, "Agent": "NPG"}, {"env_step": 2119680, "rew": 52.4514, "rew_std": 7.6594, "Agent": "NPG"}, {"env_step": 2150400, "rew": 52.8823, "rew_std": 8.3869, "Agent": "NPG"}, {"env_step": 2181120, "rew": 52.4933, "rew_std": 7.9919, "Agent": "NPG"}, {"env_step": 2211840, "rew": 52.3862, "rew_std": 9.4877, "Agent": "NPG"}, {"env_step": 2242560, "rew": 52.4636, "rew_std": 8.82, "Agent": "NPG"}, {"env_step": 2273280, "rew": 53.5679, "rew_std": 8.0208, "Agent": "NPG"}, {"env_step": 2304000, "rew": 53.8706, "rew_std": 8.2057, "Agent": "NPG"}, {"env_step": 2334720, "rew": 53.0509, "rew_std": 8.6204, "Agent": "NPG"}, {"env_step": 2365440, "rew": 54.2658, "rew_std": 8.4651, "Agent": "NPG"}, {"env_step": 2396160, "rew": 53.9384, "rew_std": 8.7643, "Agent": "NPG"}, {"env_step": 2426880, "rew": 54.6414, "rew_std": 8.3831, "Agent": "NPG"}, {"env_step": 2457600, "rew": 53.631, "rew_std": 9.6735, "Agent": "NPG"}, {"env_step": 2488320, "rew": 55.0658, "rew_std": 8.0061, "Agent": "NPG"}, {"env_step": 2519040, "rew": 55.0112, "rew_std": 8.3882, "Agent": "NPG"}, {"env_step": 2549760, "rew": 54.435, "rew_std": 9.0805, "Agent": "NPG"}, {"env_step": 2580480, "rew": 56.1105, "rew_std": 8.1764, "Agent": "NPG"}, {"env_step": 2611200, "rew": 55.5773, "rew_std": 8.3568, "Agent": "NPG"}, {"env_step": 2641920, "rew": 55.6756, "rew_std": 7.7048, "Agent": "NPG"}, {"env_step": 2672640, "rew": 55.3642, "rew_std": 8.6515, "Agent": "NPG"}, {"env_step": 2703360, "rew": 54.5606, "rew_std": 10.0831, "Agent": "NPG"}, {"env_step": 2734080, "rew": 54.6366, "rew_std": 9.9787, "Agent": "NPG"}, {"env_step": 2764800, "rew": 55.0624, "rew_std": 9.4791, "Agent": "NPG"}, {"env_step": 2795520, "rew": 56.1847, "rew_std": 8.3219, "Agent": "NPG"}, {"env_step": 2826240, "rew": 55.9843, "rew_std": 8.5039, "Agent": "NPG"}, {"env_step": 2856960, "rew": 56.2396, "rew_std": 8.3994, "Agent": "NPG"}, {"env_step": 2887680, "rew": 56.6028, "rew_std": 8.7185, "Agent": "NPG"}, {"env_step": 2918400, "rew": 56.2149, "rew_std": 7.9654, "Agent": "NPG"}, {"env_step": 2949120, "rew": 56.4201, "rew_std": 8.251, "Agent": "NPG"}, {"env_step": 2979840, "rew": 55.9212, "rew_std": 9.1663, "Agent": "NPG"}, {"env_step": 3010560, "rew": 56.5446, "rew_std": 8.7647, "Agent": "NPG"}, {"env_step": 3041280, "rew": 56.8012, "rew_std": 9.4088, "Agent": "NPG"}, {"env_step": 3072000, "rew": 56.5011, "rew_std": 8.127, "Agent": "NPG"}]