[{"env_step": 0, "rew": 53.5579, "rew_std": 5.4624, "Agent": "PPO"}, {"env_step": 30720, "rew": 390.6844, "rew_std": 47.2152, "Agent": "PPO"}, {"env_step": 61440, "rew": 4440.7883, "rew_std": 1477.9099, "Agent": "PPO"}, {"env_step": 92160, "rew": 7432.4452, "rew_std": 1137.4445, "Agent": "PPO"}, {"env_step": 122880, "rew": 8723.7104, "rew_std": 840.5556, "Agent": "PPO"}, {"env_step": 153600, "rew": 8128.2175, "rew_std": 847.2373, "Agent": "PPO"}, {"env_step": 184320, "rew": 7939.7183, "rew_std": 1185.3614, "Agent": "PPO"}, {"env_step": 215040, "rew": 8215.0721, "rew_std": 1687.6094, "Agent": "PPO"}, {"env_step": 245760, "rew": 8299.0993, "rew_std": 2014.0479, "Agent": "PPO"}, {"env_step": 276480, "rew": 7574.2882, "rew_std": 1851.2534, "Agent": "PPO"}, {"env_step": 307200, "rew": 7608.4809, "rew_std": 2040.837, "Agent": "PPO"}, {"env_step": 337920, "rew": 9160.846, "rew_std": 370.1676, "Agent": "PPO"}, {"env_step": 368640, "rew": 8165.264, "rew_std": 1476.0656, "Agent": "PPO"}, {"env_step": 399360, "rew": 9231.3001, "rew_std": 270.4215, "Agent": "PPO"}, {"env_step": 430080, "rew": 8863.8433, "rew_std": 804.7622, "Agent": "PPO"}, {"env_step": 460800, "rew": 8912.687, "rew_std": 583.0749, "Agent": "PPO"}, {"env_step": 491520, "rew": 9178.6727, "rew_std": 351.559, "Agent": "PPO"}, {"env_step": 522240, "rew": 8551.0671, "rew_std": 1781.7509, "Agent": "PPO"}, {"env_step": 552960, "rew": 8041.7706, "rew_std": 1343.6888, "Agent": "PPO"}, {"env_step": 583680, "rew": 8463.9937, "rew_std": 1607.719, "Agent": "PPO"}, {"env_step": 614400, "rew": 7499.9099, "rew_std": 1967.5161, "Agent": "PPO"}, {"env_step": 645120, "rew": 7426.7158, "rew_std": 1688.5658, "Agent": "PPO"}, {"env_step": 675840, "rew": 7450.5741, "rew_std": 1562.2172, "Agent": "PPO"}, {"env_step": 706560, "rew": 7919.1652, "rew_std": 1307.948, "Agent": "PPO"}, {"env_step": 737280, "rew": 8058.6832, "rew_std": 1555.2311, "Agent": "PPO"}, {"env_step": 768000, "rew": 7796.2947, "rew_std": 1427.9864, "Agent": "PPO"}, {"env_step": 798720, "rew": 7871.2745, "rew_std": 2091.2387, "Agent": "PPO"}, {"env_step": 829440, "rew": 7788.3739, "rew_std": 1169.7356, "Agent": "PPO"}, {"env_step": 860160, "rew": 8649.8336, "rew_std": 880.0055, "Agent": "PPO"}, {"env_step": 890880, "rew": 8629.5956, "rew_std": 883.1806, "Agent": "PPO"}, {"env_step": 921600, "rew": 7053.2239, "rew_std": 1975.2603, "Agent": "PPO"}, {"env_step": 952320, "rew": 8832.0522, "rew_std": 720.8276, "Agent": "PPO"}, {"env_step": 983040, "rew": 8695.0495, "rew_std": 1114.9476, "Agent": "PPO"}, {"env_step": 1013760, "rew": 7769.8183, "rew_std": 1044.702, "Agent": "PPO"}, {"env_step": 1044480, "rew": 7672.861, "rew_std": 2120.0992, "Agent": "PPO"}, {"env_step": 1075200, "rew": 7210.2176, "rew_std": 2072.4542, "Agent": "PPO"}, {"env_step": 1105920, "rew": 6198.4025, "rew_std": 2246.6461, "Agent": "PPO"}, {"env_step": 1136640, "rew": 6235.9517, "rew_std": 2022.0933, "Agent": "PPO"}, {"env_step": 1167360, "rew": 8930.9663, "rew_std": 552.711, "Agent": "PPO"}, {"env_step": 1198080, "rew": 7589.3857, "rew_std": 2375.9742, "Agent": "PPO"}, {"env_step": 1228800, "rew": 6630.552, "rew_std": 3211.1769, "Agent": "PPO"}, {"env_step": 1259520, "rew": 6154.6071, "rew_std": 2411.6233, "Agent": "PPO"}, {"env_step": 1290240, "rew": 6570.4411, "rew_std": 2282.5933, "Agent": "PPO"}, {"env_step": 1320960, "rew": 6988.3474, "rew_std": 1774.5001, "Agent": "PPO"}, {"env_step": 1351680, "rew": 6362.3528, "rew_std": 1873.2545, "Agent": "PPO"}, {"env_step": 1382400, "rew": 8103.1912, "rew_std": 1972.6555, "Agent": "PPO"}, {"env_step": 1413120, "rew": 8173.9319, "rew_std": 1462.2099, "Agent": "PPO"}, {"env_step": 1443840, "rew": 7561.3657, "rew_std": 1242.3688, "Agent": "PPO"}, {"env_step": 1474560, "rew": 7414.5475, "rew_std": 1797.1936, "Agent": "PPO"}, {"env_step": 1505280, "rew": 7456.7353, "rew_std": 2076.4739, "Agent": "PPO"}, {"env_step": 1536000, "rew": 7188.1632, "rew_std": 1879.0908, "Agent": "PPO"}, {"env_step": 1566720, "rew": 8456.162, "rew_std": 982.2274, "Agent": "PPO"}, {"env_step": 1597440, "rew": 7070.9443, "rew_std": 2235.7345, "Agent": "PPO"}, {"env_step": 1628160, "rew": 6318.5381, "rew_std": 1411.5987, "Agent": "PPO"}, {"env_step": 1658880, "rew": 6076.6026, "rew_std": 2673.6325, "Agent": "PPO"}, {"env_step": 1689600, "rew": 7328.0759, "rew_std": 2272.6423, "Agent": "PPO"}, {"env_step": 1720320, "rew": 7814.5406, "rew_std": 2963.4102, "Agent": "PPO"}, {"env_step": 1751040, "rew": 7140.9796, "rew_std": 2355.248, "Agent": "PPO"}, {"env_step": 1781760, "rew": 6766.0236, "rew_std": 2901.3291, "Agent": "PPO"}, {"env_step": 1812480, "rew": 5966.0184, "rew_std": 2419.0426, "Agent": "PPO"}, {"env_step": 1843200, "rew": 7952.3784, "rew_std": 2461.1629, "Agent": "PPO"}, {"env_step": 1873920, "rew": 7840.1507, "rew_std": 1948.9364, "Agent": "PPO"}, {"env_step": 1904640, "rew": 6536.9612, "rew_std": 1433.0194, "Agent": "PPO"}, {"env_step": 1935360, "rew": 6992.1694, "rew_std": 2035.752, "Agent": "PPO"}, {"env_step": 1966080, "rew": 7942.765, "rew_std": 1163.106, "Agent": "PPO"}, {"env_step": 1996800, "rew": 6991.8808, "rew_std": 2000.2169, "Agent": "PPO"}, {"env_step": 2027520, "rew": 7433.3263, "rew_std": 957.6863, "Agent": "PPO"}, {"env_step": 2058240, "rew": 7583.5617, "rew_std": 1624.175, "Agent": "PPO"}, {"env_step": 2088960, "rew": 7215.9013, "rew_std": 1515.0528, "Agent": "PPO"}, {"env_step": 2119680, "rew": 5971.309, "rew_std": 2303.5213, "Agent": "PPO"}, {"env_step": 2150400, "rew": 7132.0085, "rew_std": 1651.5937, "Agent": "PPO"}, {"env_step": 2181120, "rew": 5749.5429, "rew_std": 1756.0616, "Agent": "PPO"}, {"env_step": 2211840, "rew": 7625.1017, "rew_std": 1200.5677, "Agent": "PPO"}, {"env_step": 2242560, "rew": 5903.4396, "rew_std": 1907.4404, "Agent": "PPO"}, {"env_step": 2273280, "rew": 7209.7763, "rew_std": 1078.0066, "Agent": "PPO"}, {"env_step": 2304000, "rew": 8454.0754, "rew_std": 905.2939, "Agent": "PPO"}, {"env_step": 2334720, "rew": 6988.5313, "rew_std": 1284.9775, "Agent": "PPO"}, {"env_step": 2365440, "rew": 6159.7626, "rew_std": 1692.64, "Agent": "PPO"}, {"env_step": 2396160, "rew": 7005.0111, "rew_std": 1320.0732, "Agent": "PPO"}, {"env_step": 2426880, "rew": 6899.8644, "rew_std": 1396.3963, "Agent": "PPO"}, {"env_step": 2457600, "rew": 7638.5558, "rew_std": 1618.8543, "Agent": "PPO"}, {"env_step": 2488320, "rew": 7818.5143, "rew_std": 1324.091, "Agent": "PPO"}, {"env_step": 2519040, "rew": 6183.0189, "rew_std": 2073.5887, "Agent": "PPO"}, {"env_step": 2549760, "rew": 8044.4182, "rew_std": 922.0843, "Agent": "PPO"}, {"env_step": 2580480, "rew": 8066.0202, "rew_std": 1208.6707, "Agent": "PPO"}, {"env_step": 2611200, "rew": 7911.9955, "rew_std": 1461.3701, "Agent": "PPO"}, {"env_step": 2641920, "rew": 7744.7357, "rew_std": 1843.5026, "Agent": "PPO"}, {"env_step": 2672640, "rew": 7727.1222, "rew_std": 1227.0877, "Agent": "PPO"}, {"env_step": 2703360, "rew": 6815.0618, "rew_std": 1496.2736, "Agent": "PPO"}, {"env_step": 2734080, "rew": 6665.7163, "rew_std": 1282.2237, "Agent": "PPO"}, {"env_step": 2764800, "rew": 6194.4134, "rew_std": 1379.2422, "Agent": "PPO"}, {"env_step": 2795520, "rew": 7207.3626, "rew_std": 935.8931, "Agent": "PPO"}, {"env_step": 2826240, "rew": 8002.2676, "rew_std": 1064.0059, "Agent": "PPO"}, {"env_step": 2856960, "rew": 7120.8058, "rew_std": 1433.227, "Agent": "PPO"}, {"env_step": 2887680, "rew": 6511.8525, "rew_std": 1660.6839, "Agent": "PPO"}, {"env_step": 2918400, "rew": 6734.165, "rew_std": 1341.1131, "Agent": "PPO"}, {"env_step": 2949120, "rew": 6980.5115, "rew_std": 1604.3832, "Agent": "PPO"}, {"env_step": 2979840, "rew": 6470.7865, "rew_std": 1530.6075, "Agent": "PPO"}, {"env_step": 3010560, "rew": 7347.2895, "rew_std": 1853.1296, "Agent": "PPO"}, {"env_step": 3041280, "rew": 7558.1526, "rew_std": 1060.3463, "Agent": "PPO"}, {"env_step": 3072000, "rew": 7189.4355, "rew_std": 2075.9112, "Agent": "PPO"}, {"env_step": 5000, "rew": 282.9489, "rew_std": 105.3973, "Agent": "TD3"}, {"env_step": 10000, "rew": 967.198, "rew_std": 587.396, "Agent": "TD3"}, {"env_step": 15000, "rew": 2603.2403, "rew_std": 2591.978, "Agent": "TD3"}, {"env_step": 20000, "rew": 7167.7542, "rew_std": 3486.9054, "Agent": "TD3"}, {"env_step": 25000, "rew": 8426.4864, "rew_std": 2799.8999, "Agent": "TD3"}, {"env_step": 30000, "rew": 8421.4054, "rew_std": 2798.2367, "Agent": "TD3"}, {"env_step": 35000, "rew": 8434.9704, "rew_std": 2749.6202, "Agent": "TD3"}, {"env_step": 40000, "rew": 8462.4527, "rew_std": 2679.5802, "Agent": "TD3"}, {"env_step": 45000, "rew": 9264.4194, "rew_std": 264.6839, "Agent": "TD3"}, {"env_step": 50000, "rew": 9342.7878, "rew_std": 16.0342, "Agent": "TD3"}, {"env_step": 55000, "rew": 9349.233, "rew_std": 14.2728, "Agent": "TD3"}, {"env_step": 60000, "rew": 9251.8021, "rew_std": 277.0279, "Agent": "TD3"}, {"env_step": 65000, "rew": 9063.1921, "rew_std": 408.0763, "Agent": "TD3"}, {"env_step": 70000, "rew": 9239.0729, "rew_std": 268.5189, "Agent": "TD3"}, {"env_step": 75000, "rew": 9315.5051, "rew_std": 10.5088, "Agent": "TD3"}, {"env_step": 80000, "rew": 9311.2797, "rew_std": 3.2938, "Agent": "TD3"}, {"env_step": 85000, "rew": 9315.4548, "rew_std": 14.4811, "Agent": "TD3"}, {"env_step": 90000, "rew": 9315.1414, "rew_std": 14.8833, "Agent": "TD3"}, {"env_step": 95000, "rew": 9316.2116, "rew_std": 14.8043, "Agent": "TD3"}, {"env_step": 100000, "rew": 9315.5365, "rew_std": 14.7679, "Agent": "TD3"}, {"env_step": 105000, "rew": 9315.3719, "rew_std": 14.7958, "Agent": "TD3"}, {"env_step": 110000, "rew": 9314.6993, "rew_std": 14.8525, "Agent": "TD3"}, {"env_step": 115000, "rew": 9315.4553, "rew_std": 14.81, "Agent": "TD3"}, {"env_step": 120000, "rew": 9314.5234, "rew_std": 14.8132, "Agent": "TD3"}, {"env_step": 125000, "rew": 9313.8028, "rew_std": 12.1399, "Agent": "TD3"}, {"env_step": 130000, "rew": 9314.5627, "rew_std": 14.6963, "Agent": "TD3"}, {"env_step": 135000, "rew": 9312.9483, "rew_std": 9.0585, "Agent": "TD3"}, {"env_step": 140000, "rew": 9229.2644, "rew_std": 241.3705, "Agent": "TD3"}, {"env_step": 145000, "rew": 9309.6136, "rew_std": 0.7793, "Agent": "TD3"}, {"env_step": 150000, "rew": 9310.1716, "rew_std": 1.6606, "Agent": "TD3"}, {"env_step": 155000, "rew": 9311.2081, "rew_std": 1.3916, "Agent": "TD3"}, {"env_step": 160000, "rew": 8471.2184, "rew_std": 2516.0911, "Agent": "TD3"}, {"env_step": 165000, "rew": 8036.5291, "rew_std": 2707.4981, "Agent": "TD3"}, {"env_step": 170000, "rew": 8293.0254, "rew_std": 2553.5993, "Agent": "TD3"}, {"env_step": 175000, "rew": 8314.9329, "rew_std": 2476.8869, "Agent": "TD3"}, {"env_step": 180000, "rew": 8455.8738, "rew_std": 2564.073, "Agent": "TD3"}, {"env_step": 185000, "rew": 8452.5523, "rew_std": 2571.196, "Agent": "TD3"}, {"env_step": 190000, "rew": 8467.5006, "rew_std": 2527.4494, "Agent": "TD3"}, {"env_step": 195000, "rew": 9309.6068, "rew_std": 0.6428, "Agent": "TD3"}, {"env_step": 200000, "rew": 9309.982, "rew_std": 1.4155, "Agent": "TD3"}, {"env_step": 205000, "rew": 9310.3987, "rew_std": 2.7655, "Agent": "TD3"}, {"env_step": 210000, "rew": 9310.9153, "rew_std": 2.8681, "Agent": "TD3"}, {"env_step": 215000, "rew": 9310.6003, "rew_std": 2.9948, "Agent": "TD3"}, {"env_step": 220000, "rew": 9309.9613, "rew_std": 1.6709, "Agent": "TD3"}, {"env_step": 225000, "rew": 9310.7892, "rew_std": 2.3935, "Agent": "TD3"}, {"env_step": 230000, "rew": 9310.0957, "rew_std": 1.6486, "Agent": "TD3"}, {"env_step": 235000, "rew": 9313.6597, "rew_std": 10.337, "Agent": "TD3"}, {"env_step": 240000, "rew": 9309.9069, "rew_std": 2.888, "Agent": "TD3"}, {"env_step": 245000, "rew": 9223.8129, "rew_std": 257.1406, "Agent": "TD3"}, {"env_step": 250000, "rew": 9310.8441, "rew_std": 2.4554, "Agent": "TD3"}, {"env_step": 255000, "rew": 9310.2397, "rew_std": 2.7111, "Agent": "TD3"}, {"env_step": 260000, "rew": 9310.0834, "rew_std": 1.0443, "Agent": "TD3"}, {"env_step": 265000, "rew": 9310.5597, "rew_std": 2.2972, "Agent": "TD3"}, {"env_step": 270000, "rew": 9310.237, "rew_std": 3.2016, "Agent": "TD3"}, {"env_step": 275000, "rew": 9310.3845, "rew_std": 2.2792, "Agent": "TD3"}, {"env_step": 280000, "rew": 9312.2651, "rew_std": 6.7065, "Agent": "TD3"}, {"env_step": 285000, "rew": 9312.2881, "rew_std": 6.6489, "Agent": "TD3"}, {"env_step": 290000, "rew": 9310.0907, "rew_std": 3.6352, "Agent": "TD3"}, {"env_step": 295000, "rew": 9314.1539, "rew_std": 15.0218, "Agent": "TD3"}, {"env_step": 300000, "rew": 9051.2807, "rew_std": 775.6418, "Agent": "TD3"}, {"env_step": 305000, "rew": 8184.3012, "rew_std": 2622.3709, "Agent": "TD3"}, {"env_step": 310000, "rew": 8874.6879, "rew_std": 1312.1528, "Agent": "TD3"}, {"env_step": 315000, "rew": 9314.4322, "rew_std": 14.1116, "Agent": "TD3"}, {"env_step": 320000, "rew": 9312.8483, "rew_std": 7.482, "Agent": "TD3"}, {"env_step": 325000, "rew": 9313.6615, "rew_std": 8.8537, "Agent": "TD3"}, {"env_step": 330000, "rew": 9312.3362, "rew_std": 9.6878, "Agent": "TD3"}, {"env_step": 335000, "rew": 9311.1867, "rew_std": 4.9263, "Agent": "TD3"}, {"env_step": 340000, "rew": 9311.1632, "rew_std": 4.0272, "Agent": "TD3"}, {"env_step": 345000, "rew": 9311.8437, "rew_std": 3.7329, "Agent": "TD3"}, {"env_step": 350000, "rew": 8525.1915, "rew_std": 2368.4822, "Agent": "TD3"}, {"env_step": 355000, "rew": 9314.4612, "rew_std": 11.0448, "Agent": "TD3"}, {"env_step": 360000, "rew": 9311.3431, "rew_std": 6.6012, "Agent": "TD3"}, {"env_step": 365000, "rew": 9311.3624, "rew_std": 5.7543, "Agent": "TD3"}, {"env_step": 370000, "rew": 8267.0577, "rew_std": 2620.0102, "Agent": "TD3"}, {"env_step": 375000, "rew": 8436.7321, "rew_std": 2631.9562, "Agent": "TD3"}, {"env_step": 380000, "rew": 9144.4516, "rew_std": 514.1179, "Agent": "TD3"}, {"env_step": 385000, "rew": 9313.9002, "rew_std": 14.1223, "Agent": "TD3"}, {"env_step": 390000, "rew": 9145.3532, "rew_std": 507.4234, "Agent": "TD3"}, {"env_step": 395000, "rew": 8885.2745, "rew_std": 1022.9433, "Agent": "TD3"}, {"env_step": 400000, "rew": 9099.8592, "rew_std": 633.7039, "Agent": "TD3"}, {"env_step": 405000, "rew": 9060.6217, "rew_std": 769.8305, "Agent": "TD3"}, {"env_step": 410000, "rew": 9317.8565, "rew_std": 15.6384, "Agent": "TD3"}, {"env_step": 415000, "rew": 9317.4512, "rew_std": 15.2292, "Agent": "TD3"}, {"env_step": 420000, "rew": 9315.6176, "rew_std": 13.6355, "Agent": "TD3"}, {"env_step": 425000, "rew": 8472.1398, "rew_std": 2542.5459, "Agent": "TD3"}, {"env_step": 430000, "rew": 8639.4106, "rew_std": 2031.7747, "Agent": "TD3"}, {"env_step": 435000, "rew": 9319.8521, "rew_std": 18.4469, "Agent": "TD3"}, {"env_step": 440000, "rew": 9316.8172, "rew_std": 16.1172, "Agent": "TD3"}, {"env_step": 445000, "rew": 9319.7009, "rew_std": 20.0731, "Agent": "TD3"}, {"env_step": 450000, "rew": 9066.934, "rew_std": 762.7563, "Agent": "TD3"}, {"env_step": 455000, "rew": 8814.4498, "rew_std": 1510.9292, "Agent": "TD3"}, {"env_step": 460000, "rew": 9320.5916, "rew_std": 18.5887, "Agent": "TD3"}, {"env_step": 465000, "rew": 9318.9374, "rew_std": 18.6527, "Agent": "TD3"}, {"env_step": 470000, "rew": 8383.681, "rew_std": 2528.0881, "Agent": "TD3"}, {"env_step": 475000, "rew": 9320.2665, "rew_std": 16.8646, "Agent": "TD3"}, {"env_step": 480000, "rew": 9320.4374, "rew_std": 17.5623, "Agent": "TD3"}, {"env_step": 485000, "rew": 8444.0166, "rew_std": 2625.2926, "Agent": "TD3"}, {"env_step": 490000, "rew": 9313.9254, "rew_std": 12.639, "Agent": "TD3"}, {"env_step": 495000, "rew": 9152.4438, "rew_std": 507.472, "Agent": "TD3"}, {"env_step": 500000, "rew": 9320.859, "rew_std": 12.8297, "Agent": "TD3"}, {"env_step": 505000, "rew": 9238.7633, "rew_std": 252.8251, "Agent": "TD3"}, {"env_step": 510000, "rew": 8614.0148, "rew_std": 2124.8329, "Agent": "TD3"}, {"env_step": 515000, "rew": 9322.0179, "rew_std": 17.8638, "Agent": "TD3"}, {"env_step": 520000, "rew": 9323.2759, "rew_std": 19.0967, "Agent": "TD3"}, {"env_step": 525000, "rew": 9328.2951, "rew_std": 20.2475, "Agent": "TD3"}, {"env_step": 530000, "rew": 7765.9104, "rew_std": 3149.1228, "Agent": "TD3"}, {"env_step": 535000, "rew": 9327.4452, "rew_std": 20.3214, "Agent": "TD3"}, {"env_step": 540000, "rew": 9329.074, "rew_std": 20.3596, "Agent": "TD3"}, {"env_step": 545000, "rew": 9325.3436, "rew_std": 17.1185, "Agent": "TD3"}, {"env_step": 550000, "rew": 8989.8726, "rew_std": 1031.1772, "Agent": "TD3"}, {"env_step": 555000, "rew": 9331.0296, "rew_std": 21.2146, "Agent": "TD3"}, {"env_step": 560000, "rew": 9330.7565, "rew_std": 19.3693, "Agent": "TD3"}, {"env_step": 565000, "rew": 9329.7398, "rew_std": 20.3798, "Agent": "TD3"}, {"env_step": 570000, "rew": 9325.1319, "rew_std": 19.1622, "Agent": "TD3"}, {"env_step": 575000, "rew": 8480.9527, "rew_std": 2520.0155, "Agent": "TD3"}, {"env_step": 580000, "rew": 9321.9878, "rew_std": 15.8911, "Agent": "TD3"}, {"env_step": 585000, "rew": 8391.7263, "rew_std": 2485.2671, "Agent": "TD3"}, {"env_step": 590000, "rew": 9320.116, "rew_std": 13.4094, "Agent": "TD3"}, {"env_step": 595000, "rew": 8479.5073, "rew_std": 2522.3627, "Agent": "TD3"}, {"env_step": 600000, "rew": 9321.8606, "rew_std": 14.7027, "Agent": "TD3"}, {"env_step": 605000, "rew": 9062.4936, "rew_std": 789.4461, "Agent": "TD3"}, {"env_step": 610000, "rew": 8267.8905, "rew_std": 2266.138, "Agent": "TD3"}, {"env_step": 615000, "rew": 8488.8207, "rew_std": 2511.8177, "Agent": "TD3"}, {"env_step": 620000, "rew": 9325.2056, "rew_std": 17.2205, "Agent": "TD3"}, {"env_step": 625000, "rew": 8471.006, "rew_std": 2551.4845, "Agent": "TD3"}, {"env_step": 630000, "rew": 9243.0092, "rew_std": 243.8519, "Agent": "TD3"}, {"env_step": 635000, "rew": 9323.9628, "rew_std": 18.2174, "Agent": "TD3"}, {"env_step": 640000, "rew": 9174.3501, "rew_std": 461.7308, "Agent": "TD3"}, {"env_step": 645000, "rew": 9327.2489, "rew_std": 17.2679, "Agent": "TD3"}, {"env_step": 650000, "rew": 8608.7013, "rew_std": 2165.4249, "Agent": "TD3"}, {"env_step": 655000, "rew": 8917.4672, "rew_std": 1245.5319, "Agent": "TD3"}, {"env_step": 660000, "rew": 9333.3707, "rew_std": 18.4717, "Agent": "TD3"}, {"env_step": 665000, "rew": 8293.4616, "rew_std": 2412.2377, "Agent": "TD3"}, {"env_step": 670000, "rew": 9333.9283, "rew_std": 18.5759, "Agent": "TD3"}, {"env_step": 675000, "rew": 8487.5841, "rew_std": 2523.9032, "Agent": "TD3"}, {"env_step": 680000, "rew": 8483.1521, "rew_std": 2541.145, "Agent": "TD3"}, {"env_step": 685000, "rew": 9267.9299, "rew_std": 185.369, "Agent": "TD3"}, {"env_step": 690000, "rew": 8483.5027, "rew_std": 2533.8052, "Agent": "TD3"}, {"env_step": 695000, "rew": 8395.0935, "rew_std": 2524.5447, "Agent": "TD3"}, {"env_step": 700000, "rew": 8470.1905, "rew_std": 2562.094, "Agent": "TD3"}, {"env_step": 705000, "rew": 8476.3315, "rew_std": 2549.8972, "Agent": "TD3"}, {"env_step": 710000, "rew": 8464.8866, "rew_std": 2613.7263, "Agent": "TD3"}, {"env_step": 715000, "rew": 8537.5775, "rew_std": 2385.8565, "Agent": "TD3"}, {"env_step": 720000, "rew": 8489.6683, "rew_std": 2513.7786, "Agent": "TD3"}, {"env_step": 725000, "rew": 8475.4442, "rew_std": 2568.3238, "Agent": "TD3"}, {"env_step": 730000, "rew": 8476.2893, "rew_std": 2576.5732, "Agent": "TD3"}, {"env_step": 735000, "rew": 8451.9808, "rew_std": 2637.4094, "Agent": "TD3"}, {"env_step": 740000, "rew": 8438.7148, "rew_std": 2646.9911, "Agent": "TD3"}, {"env_step": 745000, "rew": 8551.6528, "rew_std": 2306.6298, "Agent": "TD3"}, {"env_step": 750000, "rew": 9320.1892, "rew_std": 18.8426, "Agent": "TD3"}, {"env_step": 755000, "rew": 9324.6405, "rew_std": 18.1221, "Agent": "TD3"}, {"env_step": 760000, "rew": 8951.4759, "rew_std": 1113.7195, "Agent": "TD3"}, {"env_step": 765000, "rew": 9008.1179, "rew_std": 529.2366, "Agent": "TD3"}, {"env_step": 770000, "rew": 8767.8096, "rew_std": 1685.5353, "Agent": "TD3"}, {"env_step": 775000, "rew": 8495.5212, "rew_std": 2507.0633, "Agent": "TD3"}, {"env_step": 780000, "rew": 8246.6138, "rew_std": 2562.1309, "Agent": "TD3"}, {"env_step": 785000, "rew": 8475.1777, "rew_std": 2579.23, "Agent": "TD3"}, {"env_step": 790000, "rew": 8479.8606, "rew_std": 2072.6119, "Agent": "TD3"}, {"env_step": 795000, "rew": 7802.9669, "rew_std": 3063.6171, "Agent": "TD3"}, {"env_step": 800000, "rew": 8453.7153, "rew_std": 2637.2187, "Agent": "TD3"}, {"env_step": 805000, "rew": 9238.6734, "rew_std": 276.5512, "Agent": "TD3"}, {"env_step": 810000, "rew": 9333.529, "rew_std": 21.4153, "Agent": "TD3"}, {"env_step": 815000, "rew": 9327.587, "rew_std": 19.7504, "Agent": "TD3"}, {"env_step": 820000, "rew": 9330.4714, "rew_std": 20.4379, "Agent": "TD3"}, {"env_step": 825000, "rew": 9336.9744, "rew_std": 19.5782, "Agent": "TD3"}, {"env_step": 830000, "rew": 9329.7092, "rew_std": 21.4864, "Agent": "TD3"}, {"env_step": 835000, "rew": 9331.23, "rew_std": 18.5596, "Agent": "TD3"}, {"env_step": 840000, "rew": 9328.854, "rew_std": 21.1961, "Agent": "TD3"}, {"env_step": 845000, "rew": 9327.2057, "rew_std": 22.8246, "Agent": "TD3"}, {"env_step": 850000, "rew": 8903.428, "rew_std": 1283.9923, "Agent": "TD3"}, {"env_step": 855000, "rew": 8621.8355, "rew_std": 2140.9923, "Agent": "TD3"}, {"env_step": 860000, "rew": 9331.3873, "rew_std": 21.2049, "Agent": "TD3"}, {"env_step": 865000, "rew": 8512.1406, "rew_std": 2475.3905, "Agent": "TD3"}, {"env_step": 870000, "rew": 9267.4105, "rew_std": 213.968, "Agent": "TD3"}, {"env_step": 875000, "rew": 9333.9985, "rew_std": 19.9086, "Agent": "TD3"}, {"env_step": 880000, "rew": 9335.3527, "rew_std": 18.5561, "Agent": "TD3"}, {"env_step": 885000, "rew": 9162.3701, "rew_std": 536.2045, "Agent": "TD3"}, {"env_step": 890000, "rew": 8418.461, "rew_std": 2207.2014, "Agent": "TD3"}, {"env_step": 895000, "rew": 8492.1865, "rew_std": 1591.2265, "Agent": "TD3"}, {"env_step": 900000, "rew": 8446.7387, "rew_std": 2652.4248, "Agent": "TD3"}, {"env_step": 905000, "rew": 8747.1687, "rew_std": 1331.51, "Agent": "TD3"}, {"env_step": 910000, "rew": 8839.1724, "rew_std": 1487.8274, "Agent": "TD3"}, {"env_step": 915000, "rew": 9336.9595, "rew_std": 20.1037, "Agent": "TD3"}, {"env_step": 920000, "rew": 9338.5807, "rew_std": 19.6659, "Agent": "TD3"}, {"env_step": 925000, "rew": 8468.7912, "rew_std": 2574.2131, "Agent": "TD3"}, {"env_step": 930000, "rew": 9327.7642, "rew_std": 15.1276, "Agent": "TD3"}, {"env_step": 935000, "rew": 9334.2831, "rew_std": 16.6168, "Agent": "TD3"}, {"env_step": 940000, "rew": 9328.7489, "rew_std": 19.5544, "Agent": "TD3"}, {"env_step": 945000, "rew": 9333.8926, "rew_std": 21.3318, "Agent": "TD3"}, {"env_step": 950000, "rew": 8653.8862, "rew_std": 2015.9693, "Agent": "TD3"}, {"env_step": 955000, "rew": 7621.0775, "rew_std": 2831.5293, "Agent": "TD3"}, {"env_step": 960000, "rew": 9333.3804, "rew_std": 19.1393, "Agent": "TD3"}, {"env_step": 965000, "rew": 9327.7606, "rew_std": 15.0447, "Agent": "TD3"}, {"env_step": 970000, "rew": 9330.358, "rew_std": 18.4475, "Agent": "TD3"}, {"env_step": 975000, "rew": 8709.456, "rew_std": 1851.1411, "Agent": "TD3"}, {"env_step": 980000, "rew": 9333.1847, "rew_std": 19.0763, "Agent": "TD3"}, {"env_step": 985000, "rew": 9328.7851, "rew_std": 19.2249, "Agent": "TD3"}, {"env_step": 990000, "rew": 9334.8215, "rew_std": 17.4106, "Agent": "TD3"}, {"env_step": 995000, "rew": 9330.7308, "rew_std": 16.6466, "Agent": "TD3"}, {"env_step": 1000000, "rew": 9333.4001, "rew_std": 18.7685, "Agent": "TD3"}, {"env_step": 1005000, "rew": 9327.9781, "rew_std": 15.018, "Agent": "TD3"}, {"env_step": 1010000, "rew": 8995.3494, "rew_std": 764.8608, "Agent": "TD3"}, {"env_step": 1015000, "rew": 9330.6447, "rew_std": 20.8002, "Agent": "TD3"}, {"env_step": 1020000, "rew": 9323.7909, "rew_std": 15.9208, "Agent": "TD3"}, {"env_step": 1025000, "rew": 9328.5144, "rew_std": 14.8415, "Agent": "TD3"}, {"env_step": 1030000, "rew": 9329.8467, "rew_std": 17.4232, "Agent": "TD3"}, {"env_step": 1035000, "rew": 9326.6478, "rew_std": 14.85, "Agent": "TD3"}, {"env_step": 1040000, "rew": 9149.0301, "rew_std": 356.8972, "Agent": "TD3"}, {"env_step": 1045000, "rew": 9327.1727, "rew_std": 13.5036, "Agent": "TD3"}, {"env_step": 1050000, "rew": 9333.3892, "rew_std": 17.5108, "Agent": "TD3"}, {"env_step": 1055000, "rew": 8927.7454, "rew_std": 1201.0765, "Agent": "TD3"}, {"env_step": 1060000, "rew": 8845.8415, "rew_std": 1166.0041, "Agent": "TD3"}, {"env_step": 1065000, "rew": 9325.4141, "rew_std": 15.648, "Agent": "TD3"}, {"env_step": 1070000, "rew": 9319.1911, "rew_std": 14.7747, "Agent": "TD3"}, {"env_step": 1075000, "rew": 9322.9721, "rew_std": 11.5142, "Agent": "TD3"}, {"env_step": 1080000, "rew": 9321.295, "rew_std": 8.3382, "Agent": "TD3"}, {"env_step": 1085000, "rew": 8626.7788, "rew_std": 2096.5287, "Agent": "TD3"}, {"env_step": 1090000, "rew": 8702.9198, "rew_std": 1852.4358, "Agent": "TD3"}, {"env_step": 1095000, "rew": 8883.6199, "rew_std": 1310.4064, "Agent": "TD3"}, {"env_step": 1100000, "rew": 8636.9099, "rew_std": 2058.3565, "Agent": "TD3"}, {"env_step": 1105000, "rew": 9319.5485, "rew_std": 13.8536, "Agent": "TD3"}, {"env_step": 1110000, "rew": 9319.021, "rew_std": 11.4661, "Agent": "TD3"}, {"env_step": 1115000, "rew": 9319.6046, "rew_std": 11.8647, "Agent": "TD3"}, {"env_step": 1120000, "rew": 9322.6937, "rew_std": 13.0633, "Agent": "TD3"}, {"env_step": 1125000, "rew": 8474.7102, "rew_std": 2555.5902, "Agent": "TD3"}, {"env_step": 1130000, "rew": 8490.9087, "rew_std": 2063.7339, "Agent": "TD3"}, {"env_step": 1135000, "rew": 9156.6945, "rew_std": 513.5511, "Agent": "TD3"}, {"env_step": 1140000, "rew": 9323.0957, "rew_std": 17.2924, "Agent": "TD3"}, {"env_step": 1145000, "rew": 9234.5272, "rew_std": 259.9814, "Agent": "TD3"}, {"env_step": 1150000, "rew": 8800.384, "rew_std": 1114.5204, "Agent": "TD3"}, {"env_step": 1155000, "rew": 8976.3803, "rew_std": 1050.1321, "Agent": "TD3"}, {"env_step": 1160000, "rew": 9326.5404, "rew_std": 13.1945, "Agent": "TD3"}, {"env_step": 1165000, "rew": 9325.8077, "rew_std": 17.0369, "Agent": "TD3"}, {"env_step": 1170000, "rew": 8887.2947, "rew_std": 1309.6168, "Agent": "TD3"}, {"env_step": 1175000, "rew": 9322.4509, "rew_std": 17.1221, "Agent": "TD3"}, {"env_step": 1180000, "rew": 9323.5382, "rew_std": 16.3925, "Agent": "TD3"}, {"env_step": 1185000, "rew": 9325.3668, "rew_std": 17.4452, "Agent": "TD3"}, {"env_step": 1190000, "rew": 8981.4488, "rew_std": 1037.9468, "Agent": "TD3"}, {"env_step": 1195000, "rew": 8478.0402, "rew_std": 2549.7415, "Agent": "TD3"}, {"env_step": 1200000, "rew": 8589.0557, "rew_std": 2228.981, "Agent": "TD3"}, {"env_step": 1205000, "rew": 9329.7533, "rew_std": 14.2779, "Agent": "TD3"}, {"env_step": 1210000, "rew": 8508.0089, "rew_std": 2489.3719, "Agent": "TD3"}, {"env_step": 1215000, "rew": 9080.1032, "rew_std": 743.7643, "Agent": "TD3"}, {"env_step": 1220000, "rew": 8915.0462, "rew_std": 1257.401, "Agent": "TD3"}, {"env_step": 1225000, "rew": 9331.3188, "rew_std": 14.9061, "Agent": "TD3"}, {"env_step": 1230000, "rew": 9332.644, "rew_std": 15.5307, "Agent": "TD3"}, {"env_step": 1235000, "rew": 9327.1162, "rew_std": 12.8789, "Agent": "TD3"}, {"env_step": 1240000, "rew": 9318.4714, "rew_std": 7.6461, "Agent": "TD3"}, {"env_step": 1245000, "rew": 9321.1796, "rew_std": 11.7523, "Agent": "TD3"}, {"env_step": 1250000, "rew": 9326.545, "rew_std": 11.7313, "Agent": "TD3"}, {"env_step": 0, "rew": 60.0108, "rew_std": 6.0382, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 66.8851, "rew_std": 4.8886, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 82.7432, "rew_std": 7.4298, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 96.5871, "rew_std": 14.5135, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 112.431, "rew_std": 7.34, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 122.4389, "rew_std": 18.2545, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 155.4821, "rew_std": 34.0244, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 183.7388, "rew_std": 29.0268, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 228.9308, "rew_std": 42.0714, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 295.3232, "rew_std": 37.5235, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 290.0857, "rew_std": 26.9366, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 327.8566, "rew_std": 61.7201, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 357.6878, "rew_std": 41.0322, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 366.3419, "rew_std": 33.2445, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 381.9601, "rew_std": 66.8866, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 368.2484, "rew_std": 48.6524, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 378.9139, "rew_std": 37.3082, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 380.7339, "rew_std": 55.8626, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 387.7164, "rew_std": 34.7361, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 376.7374, "rew_std": 31.788, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 353.7732, "rew_std": 37.8586, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 357.7262, "rew_std": 68.3217, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 370.7562, "rew_std": 67.7155, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 383.0227, "rew_std": 54.1512, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 368.886, "rew_std": 56.9815, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 404.9809, "rew_std": 47.8215, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 426.8464, "rew_std": 50.1806, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 370.5083, "rew_std": 42.005, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 436.8902, "rew_std": 60.5663, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 420.3315, "rew_std": 82.9773, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 382.7165, "rew_std": 64.6931, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 424.8106, "rew_std": 55.993, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 434.6915, "rew_std": 56.8445, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 427.4304, "rew_std": 54.1882, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 435.5741, "rew_std": 80.3884, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 417.8789, "rew_std": 48.7039, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 388.0945, "rew_std": 69.9208, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 416.8366, "rew_std": 48.7602, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 490.229, "rew_std": 59.7515, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 416.1175, "rew_std": 39.6707, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 422.501, "rew_std": 63.4279, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 445.428, "rew_std": 79.5721, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 484.8554, "rew_std": 54.9234, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 405.2333, "rew_std": 64.6929, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 439.0572, "rew_std": 77.0379, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 413.4107, "rew_std": 64.2411, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 477.1185, "rew_std": 70.4266, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 437.3873, "rew_std": 65.7348, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 508.2686, "rew_std": 53.6442, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 431.5613, "rew_std": 58.691, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 504.4616, "rew_std": 104.7558, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 514.0627, "rew_std": 113.1402, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 438.4226, "rew_std": 85.4795, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 508.8552, "rew_std": 73.1902, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 524.1776, "rew_std": 46.6835, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 443.152, "rew_std": 72.039, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 514.0757, "rew_std": 102.6964, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 536.2226, "rew_std": 100.2774, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 512.4202, "rew_std": 69.555, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 466.9226, "rew_std": 51.3613, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 526.6333, "rew_std": 110.1826, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 563.423, "rew_std": 88.7347, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 488.7421, "rew_std": 94.6149, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 527.4116, "rew_std": 72.0684, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 584.751, "rew_std": 106.5506, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 512.967, "rew_std": 76.5018, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 520.3164, "rew_std": 79.305, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 543.088, "rew_std": 180.1451, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 572.2448, "rew_std": 112.2051, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 483.6695, "rew_std": 79.7298, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 576.0319, "rew_std": 166.6031, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 541.9739, "rew_std": 104.8883, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 584.6133, "rew_std": 134.5258, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 571.4616, "rew_std": 102.7021, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 695.0859, "rew_std": 210.1589, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 622.2008, "rew_std": 153.9995, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 599.7726, "rew_std": 122.7385, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 649.5761, "rew_std": 106.0541, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 634.764, "rew_std": 102.9666, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 647.247, "rew_std": 46.9642, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 619.0498, "rew_std": 100.3413, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 669.8866, "rew_std": 140.8498, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 662.3441, "rew_std": 140.1168, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 810.179, "rew_std": 110.0032, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 725.5527, "rew_std": 201.8621, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 698.9872, "rew_std": 191.0236, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 767.5747, "rew_std": 260.1571, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 753.5526, "rew_std": 214.4276, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 666.5184, "rew_std": 142.1623, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 755.6162, "rew_std": 171.7469, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 802.2893, "rew_std": 151.2001, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 828.3906, "rew_std": 168.4727, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 859.1231, "rew_std": 185.7303, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 847.9353, "rew_std": 255.6323, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 848.9568, "rew_std": 255.9742, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 980.2406, "rew_std": 319.6858, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 948.7681, "rew_std": 169.0014, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 1016.5807, "rew_std": 262.9115, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 1019.1342, "rew_std": 297.7281, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 1059.747, "rew_std": 307.6851, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 978.2747, "rew_std": 345.3194, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 1160.4319, "rew_std": 464.3403, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 1200.1039, "rew_std": 362.0233, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 1059.5822, "rew_std": 280.4559, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 1225.6168, "rew_std": 371.406, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 1282.9805, "rew_std": 302.5772, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 1273.2309, "rew_std": 349.0168, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 1300.563, "rew_std": 425.1841, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 1011.3652, "rew_std": 267.331, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 1282.4909, "rew_std": 294.3243, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 1185.7562, "rew_std": 321.7863, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 1171.4334, "rew_std": 360.5962, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 1195.9001, "rew_std": 331.9413, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 1312.6145, "rew_std": 329.9906, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 1415.1494, "rew_std": 404.2971, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 1402.2373, "rew_std": 322.0836, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 1508.4332, "rew_std": 578.56, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 1398.8295, "rew_std": 532.5828, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 1158.1128, "rew_std": 349.4831, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 1386.2969, "rew_std": 574.8848, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 1214.1347, "rew_std": 394.7353, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 1749.9282, "rew_std": 1070.3417, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 1778.2408, "rew_std": 830.1728, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 1788.488, "rew_std": 940.4839, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 1806.6416, "rew_std": 694.6308, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 1628.9717, "rew_std": 993.5847, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 1612.6756, "rew_std": 955.6134, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 1760.4958, "rew_std": 1022.6508, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 1685.1773, "rew_std": 963.1458, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 2038.9305, "rew_std": 873.6692, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 1994.5574, "rew_std": 874.5238, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 2290.5792, "rew_std": 893.5474, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 2093.8009, "rew_std": 907.8444, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 1935.4176, "rew_std": 949.8348, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 1591.5349, "rew_std": 572.0568, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 2063.1639, "rew_std": 1069.8277, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 2142.1858, "rew_std": 856.4905, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 2110.9033, "rew_std": 669.7878, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 1877.9988, "rew_std": 973.6438, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 2330.0562, "rew_std": 1048.8469, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 2753.4828, "rew_std": 1178.0501, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 2482.2992, "rew_std": 786.2175, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 2500.011, "rew_std": 857.6858, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 2082.2058, "rew_std": 875.8882, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 2695.8844, "rew_std": 1156.2615, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 2012.0529, "rew_std": 639.3927, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 2192.864, "rew_std": 1125.1998, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 3015.4809, "rew_std": 1806.7113, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 2323.9941, "rew_std": 547.3481, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 2732.3637, "rew_std": 1304.811, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 2099.5867, "rew_std": 709.0763, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 2504.8862, "rew_std": 1158.8266, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 2336.4626, "rew_std": 1013.3587, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 2820.9975, "rew_std": 700.505, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 2551.0595, "rew_std": 751.2494, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 2306.5164, "rew_std": 725.9532, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 2176.1637, "rew_std": 741.4824, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 2966.1284, "rew_std": 1269.1187, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 3351.2094, "rew_std": 1112.0173, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 3842.1464, "rew_std": 1570.3156, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 2989.541, "rew_std": 1266.7222, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 2758.6786, "rew_std": 990.1936, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 3405.5566, "rew_std": 1518.9021, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 3869.2983, "rew_std": 1851.353, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 2729.3042, "rew_std": 892.573, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 3314.1694, "rew_std": 1323.7672, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 4038.4395, "rew_std": 943.1128, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 3256.4594, "rew_std": 1306.8482, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 2987.736, "rew_std": 839.0792, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 3309.6143, "rew_std": 1086.4379, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 3487.2926, "rew_std": 1349.5377, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 3662.9314, "rew_std": 966.6369, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 3951.659, "rew_std": 1427.5392, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 3243.6001, "rew_std": 1070.5047, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 3722.7722, "rew_std": 1532.4533, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 3645.6966, "rew_std": 1085.0242, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 3553.8285, "rew_std": 1506.3794, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 3428.5119, "rew_std": 1508.2119, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 3170.9381, "rew_std": 1967.1882, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 3263.9317, "rew_std": 1140.5613, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 2956.3149, "rew_std": 960.4775, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 3669.0042, "rew_std": 1323.1323, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 4026.5697, "rew_std": 1166.8394, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 4183.9457, "rew_std": 1343.1734, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 4219.2541, "rew_std": 968.9301, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 3545.1333, "rew_std": 1469.0964, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 3831.7193, "rew_std": 1692.2045, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 3304.0221, "rew_std": 1336.8871, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 3031.8385, "rew_std": 1379.532, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 3934.2707, "rew_std": 889.5228, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 3236.5811, "rew_std": 1150.3347, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 3755.1395, "rew_std": 1577.0949, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 4502.6478, "rew_std": 1060.7047, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 4059.5553, "rew_std": 1356.9739, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 4304.8758, "rew_std": 1531.4219, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 4732.0622, "rew_std": 1401.7171, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 4927.5947, "rew_std": 1735.7823, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 4896.0143, "rew_std": 2095.2379, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 4038.2881, "rew_std": 2124.3119, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 4884.944, "rew_std": 2155.9927, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 4460.7201, "rew_std": 1099.7811, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 4355.8913, "rew_std": 994.335, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 4483.3853, "rew_std": 1632.5418, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 5376.8727, "rew_std": 1175.4768, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 5028.3366, "rew_std": 1725.2833, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 5834.3314, "rew_std": 1182.5593, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 5169.7081, "rew_std": 1486.7668, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 5154.2478, "rew_std": 1111.2708, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 4502.9293, "rew_std": 1125.813, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 4459.1707, "rew_std": 1108.9785, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 5311.4787, "rew_std": 1873.4583, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 5532.3912, "rew_std": 2139.4747, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 5280.449, "rew_std": 1447.4049, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 5015.1148, "rew_std": 1553.0882, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 4470.1792, "rew_std": 1804.0072, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 4214.2721, "rew_std": 1353.1881, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 5256.508, "rew_std": 1465.1617, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 5192.832, "rew_std": 1256.6718, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 5149.1533, "rew_std": 1938.2363, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 4871.797, "rew_std": 1085.56, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 5401.9239, "rew_std": 1134.1753, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 4990.7386, "rew_std": 1913.7971, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 5715.5955, "rew_std": 1215.5666, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 5857.0221, "rew_std": 1281.9894, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 5648.1819, "rew_std": 1136.7722, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 5817.961, "rew_std": 1547.1178, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 6049.0488, "rew_std": 1193.2055, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 5471.947, "rew_std": 1142.1615, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 6081.4353, "rew_std": 1233.8771, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 5363.5289, "rew_std": 970.5114, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 5779.5069, "rew_std": 1246.4714, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 5788.5086, "rew_std": 1228.3144, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 4967.2815, "rew_std": 1767.1772, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 4538.9419, "rew_std": 1589.6502, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 5137.0493, "rew_std": 1700.3284, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 5012.8316, "rew_std": 1527.0919, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 6073.756, "rew_std": 1803.8926, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 5434.4797, "rew_std": 1784.3038, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 5634.7391, "rew_std": 1627.405, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 6050.9446, "rew_std": 1251.8911, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 5799.2364, "rew_std": 1298.4554, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 5395.9884, "rew_std": 1760.5917, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 5073.6754, "rew_std": 1554.3566, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 5815.9828, "rew_std": 1015.2138, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 5884.6845, "rew_std": 1499.5421, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 6234.7842, "rew_std": 1264.545, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 5556.2612, "rew_std": 1266.8728, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 5691.0096, "rew_std": 1742.2202, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 5424.3148, "rew_std": 1324.0728, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 5504.6508, "rew_std": 1257.7258, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 5705.7458, "rew_std": 1287.1892, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 5963.5763, "rew_std": 1430.009, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 5339.8363, "rew_std": 1447.4924, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 5916.8767, "rew_std": 1510.3091, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 5386.2398, "rew_std": 1841.1415, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 5538.2181, "rew_std": 1806.8538, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 5652.5788, "rew_std": 1777.7795, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 6067.3995, "rew_std": 1497.3349, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 6354.8653, "rew_std": 1497.8889, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 5823.1186, "rew_std": 1269.9062, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 6275.2123, "rew_std": 1495.5294, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 6120.7756, "rew_std": 1372.5631, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 6376.4303, "rew_std": 1571.4903, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 6652.7371, "rew_std": 1835.958, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 6444.4723, "rew_std": 1110.3799, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 7217.0162, "rew_std": 1063.6642, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 5653.2569, "rew_std": 1414.6232, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 6460.5066, "rew_std": 952.3641, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 5945.2504, "rew_std": 1054.7127, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 5392.9994, "rew_std": 946.8632, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 5711.6941, "rew_std": 1424.4968, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 6544.5364, "rew_std": 1623.5174, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 5464.2413, "rew_std": 2142.0475, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 6105.3293, "rew_std": 2194.9652, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 5271.8896, "rew_std": 1588.2101, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 5453.34, "rew_std": 1647.1389, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 5382.6643, "rew_std": 1333.2283, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 6127.8232, "rew_std": 1471.4567, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 5988.2806, "rew_std": 1687.2463, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 6061.9376, "rew_std": 954.6449, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 6159.4407, "rew_std": 1555.6679, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 5990.1787, "rew_std": 1561.9069, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 6602.3922, "rew_std": 1792.703, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 6646.9446, "rew_std": 1388.1919, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 6394.6836, "rew_std": 970.0849, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 6877.8872, "rew_std": 1009.9845, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 6184.5929, "rew_std": 1464.8502, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 6062.8531, "rew_std": 1367.4635, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 6737.3933, "rew_std": 1261.609, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 6322.801, "rew_std": 1068.3317, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 6125.2032, "rew_std": 1196.5361, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 6146.5552, "rew_std": 1153.7217, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 6812.214, "rew_std": 530.805, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 6844.0914, "rew_std": 841.6548, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 6873.7066, "rew_std": 1135.0747, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 6635.5172, "rew_std": 1004.5649, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 6693.6973, "rew_std": 1015.4753, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 6887.9459, "rew_std": 1380.6248, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 6694.8057, "rew_std": 1666.3847, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 6762.1576, "rew_std": 1212.6116, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 7726.2164, "rew_std": 1287.2782, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 6567.3651, "rew_std": 969.8238, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 6641.0387, "rew_std": 1302.7611, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 6559.1865, "rew_std": 1104.5484, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 6207.0497, "rew_std": 1099.3404, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 6919.7114, "rew_std": 1198.3527, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 6900.913, "rew_std": 1189.5731, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 6333.3599, "rew_std": 1552.1746, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 6961.7171, "rew_std": 1292.5547, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 6839.8277, "rew_std": 928.9957, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 6278.2224, "rew_std": 572.1307, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 6150.1885, "rew_std": 1659.5018, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 6263.9494, "rew_std": 778.401, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 6700.659, "rew_std": 743.8524, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 6855.1353, "rew_std": 1217.9605, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 7503.265, "rew_std": 839.6838, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 7234.1868, "rew_std": 1186.2327, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 7017.3017, "rew_std": 917.1484, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 6725.5028, "rew_std": 800.6937, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 7065.9637, "rew_std": 1153.5137, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 6378.6522, "rew_std": 1429.952, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 6962.9597, "rew_std": 1037.9087, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 6958.6688, "rew_std": 1213.9064, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 7098.3389, "rew_std": 1145.1282, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 6609.1988, "rew_std": 1108.0279, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 7164.6662, "rew_std": 1137.4225, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 7364.7105, "rew_std": 993.5177, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 6631.3363, "rew_std": 1164.1259, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 6664.8013, "rew_std": 1606.3458, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 6859.2966, "rew_std": 1411.2013, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 6828.3037, "rew_std": 995.2747, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 6260.87, "rew_std": 1026.5741, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 6688.6403, "rew_std": 1283.3219, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 7276.2345, "rew_std": 985.5105, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 87.8507, "rew_std": 12.8325, "Agent": "SAC"}, {"env_step": 5000, "rew": 756.2125, "rew_std": 257.9012, "Agent": "SAC"}, {"env_step": 10000, "rew": 7728.6778, "rew_std": 3036.0068, "Agent": "SAC"}, {"env_step": 15000, "rew": 9345.2064, "rew_std": 7.1745, "Agent": "SAC"}, {"env_step": 20000, "rew": 9067.9081, "rew_std": 568.0202, "Agent": "SAC"}, {"env_step": 25000, "rew": 9251.3634, "rew_std": 273.4882, "Agent": "SAC"}, {"env_step": 30000, "rew": 9339.7022, "rew_std": 13.0168, "Agent": "SAC"}, {"env_step": 35000, "rew": 9341.0825, "rew_std": 8.3511, "Agent": "SAC"}, {"env_step": 40000, "rew": 9179.9443, "rew_std": 482.8777, "Agent": "SAC"}, {"env_step": 45000, "rew": 9349.2818, "rew_std": 7.345, "Agent": "SAC"}, {"env_step": 50000, "rew": 9347.1812, "rew_std": 5.5747, "Agent": "SAC"}, {"env_step": 55000, "rew": 9343.8767, "rew_std": 7.8371, "Agent": "SAC"}, {"env_step": 60000, "rew": 9348.0068, "rew_std": 5.8836, "Agent": "SAC"}, {"env_step": 65000, "rew": 9076.2041, "rew_std": 410.8547, "Agent": "SAC"}, {"env_step": 70000, "rew": 9351.7263, "rew_std": 4.4372, "Agent": "SAC"}, {"env_step": 75000, "rew": 9353.7934, "rew_std": 3.4108, "Agent": "SAC"}, {"env_step": 80000, "rew": 9353.4646, "rew_std": 3.3222, "Agent": "SAC"}, {"env_step": 85000, "rew": 9355.8036, "rew_std": 2.1557, "Agent": "SAC"}, {"env_step": 90000, "rew": 9353.5623, "rew_std": 4.9767, "Agent": "SAC"}, {"env_step": 95000, "rew": 9353.3058, "rew_std": 4.9776, "Agent": "SAC"}, {"env_step": 100000, "rew": 9354.1422, "rew_std": 4.1689, "Agent": "SAC"}, {"env_step": 105000, "rew": 9353.5129, "rew_std": 4.658, "Agent": "SAC"}, {"env_step": 110000, "rew": 9355.5423, "rew_std": 2.9517, "Agent": "SAC"}, {"env_step": 115000, "rew": 9193.4331, "rew_std": 492.2324, "Agent": "SAC"}, {"env_step": 120000, "rew": 9356.9442, "rew_std": 4.6735, "Agent": "SAC"}, {"env_step": 125000, "rew": 9358.2736, "rew_std": 1.8483, "Agent": "SAC"}, {"env_step": 130000, "rew": 9357.66, "rew_std": 2.5569, "Agent": "SAC"}, {"env_step": 135000, "rew": 9357.4056, "rew_std": 2.5524, "Agent": "SAC"}, {"env_step": 140000, "rew": 9357.8777, "rew_std": 2.6114, "Agent": "SAC"}, {"env_step": 145000, "rew": 9357.2298, "rew_std": 3.1278, "Agent": "SAC"}, {"env_step": 150000, "rew": 8600.7654, "rew_std": 2274.1217, "Agent": "SAC"}, {"env_step": 155000, "rew": 9199.7953, "rew_std": 472.8582, "Agent": "SAC"}, {"env_step": 160000, "rew": 9357.0128, "rew_std": 2.0788, "Agent": "SAC"}, {"env_step": 165000, "rew": 9270.2483, "rew_std": 266.3928, "Agent": "SAC"}, {"env_step": 170000, "rew": 9359.2144, "rew_std": 0.4645, "Agent": "SAC"}, {"env_step": 175000, "rew": 9358.4945, "rew_std": 1.9754, "Agent": "SAC"}, {"env_step": 180000, "rew": 9358.0269, "rew_std": 2.3514, "Agent": "SAC"}, {"env_step": 185000, "rew": 9358.1878, "rew_std": 2.0733, "Agent": "SAC"}, {"env_step": 190000, "rew": 9359.2768, "rew_std": 0.4847, "Agent": "SAC"}, {"env_step": 195000, "rew": 9359.55, "rew_std": 0.3739, "Agent": "SAC"}, {"env_step": 200000, "rew": 9358.4272, "rew_std": 2.6085, "Agent": "SAC"}, {"env_step": 205000, "rew": 9189.6563, "rew_std": 504.8487, "Agent": "SAC"}, {"env_step": 210000, "rew": 9358.7361, "rew_std": 1.912, "Agent": "SAC"}, {"env_step": 215000, "rew": 9359.223, "rew_std": 0.9374, "Agent": "SAC"}, {"env_step": 220000, "rew": 9358.6182, "rew_std": 1.5412, "Agent": "SAC"}, {"env_step": 225000, "rew": 9357.2911, "rew_std": 3.1816, "Agent": "SAC"}, {"env_step": 230000, "rew": 9358.2075, "rew_std": 1.7019, "Agent": "SAC"}, {"env_step": 235000, "rew": 9358.601, "rew_std": 1.2267, "Agent": "SAC"}, {"env_step": 240000, "rew": 9359.2408, "rew_std": 0.8431, "Agent": "SAC"}, {"env_step": 245000, "rew": 9272.3552, "rew_std": 256.1615, "Agent": "SAC"}, {"env_step": 250000, "rew": 9358.7978, "rew_std": 0.9196, "Agent": "SAC"}, {"env_step": 255000, "rew": 9359.4003, "rew_std": 0.611, "Agent": "SAC"}, {"env_step": 260000, "rew": 9289.9692, "rew_std": 206.5769, "Agent": "SAC"}, {"env_step": 265000, "rew": 9359.103, "rew_std": 0.7612, "Agent": "SAC"}, {"env_step": 270000, "rew": 9357.6548, "rew_std": 2.754, "Agent": "SAC"}, {"env_step": 275000, "rew": 9359.2981, "rew_std": 0.6554, "Agent": "SAC"}, {"env_step": 280000, "rew": 9358.866, "rew_std": 0.9736, "Agent": "SAC"}, {"env_step": 285000, "rew": 9357.7487, "rew_std": 3.921, "Agent": "SAC"}, {"env_step": 290000, "rew": 9357.2292, "rew_std": 2.6113, "Agent": "SAC"}, {"env_step": 295000, "rew": 8815.7244, "rew_std": 1630.2044, "Agent": "SAC"}, {"env_step": 300000, "rew": 8736.6906, "rew_std": 1865.9664, "Agent": "SAC"}, {"env_step": 305000, "rew": 9358.1978, "rew_std": 1.6803, "Agent": "SAC"}, {"env_step": 310000, "rew": 9357.3869, "rew_std": 3.205, "Agent": "SAC"}, {"env_step": 315000, "rew": 8690.9313, "rew_std": 1999.8899, "Agent": "SAC"}, {"env_step": 320000, "rew": 9357.4604, "rew_std": 2.3499, "Agent": "SAC"}, {"env_step": 325000, "rew": 9357.4597, "rew_std": 2.775, "Agent": "SAC"}, {"env_step": 330000, "rew": 9358.9668, "rew_std": 0.7506, "Agent": "SAC"}, {"env_step": 335000, "rew": 9355.8857, "rew_std": 10.1018, "Agent": "SAC"}, {"env_step": 340000, "rew": 8677.3081, "rew_std": 2045.4936, "Agent": "SAC"}, {"env_step": 345000, "rew": 8398.0554, "rew_std": 2619.1756, "Agent": "SAC"}, {"env_step": 350000, "rew": 7765.9506, "rew_std": 3186.7966, "Agent": "SAC"}, {"env_step": 355000, "rew": 9357.3369, "rew_std": 3.3379, "Agent": "SAC"}, {"env_step": 360000, "rew": 9358.0212, "rew_std": 1.5434, "Agent": "SAC"}, {"env_step": 365000, "rew": 9357.3291, "rew_std": 2.4368, "Agent": "SAC"}, {"env_step": 370000, "rew": 8527.6686, "rew_std": 2486.9701, "Agent": "SAC"}, {"env_step": 375000, "rew": 9356.9724, "rew_std": 3.4184, "Agent": "SAC"}, {"env_step": 380000, "rew": 9357.8325, "rew_std": 2.2129, "Agent": "SAC"}, {"env_step": 385000, "rew": 9358.8762, "rew_std": 1.1965, "Agent": "SAC"}, {"env_step": 390000, "rew": 9358.5068, "rew_std": 1.6315, "Agent": "SAC"}, {"env_step": 395000, "rew": 9358.6581, "rew_std": 1.2426, "Agent": "SAC"}, {"env_step": 400000, "rew": 9284.3148, "rew_std": 221.399, "Agent": "SAC"}, {"env_step": 405000, "rew": 8510.3777, "rew_std": 2542.6878, "Agent": "SAC"}, {"env_step": 410000, "rew": 8579.7797, "rew_std": 2329.1843, "Agent": "SAC"}, {"env_step": 415000, "rew": 9357.8998, "rew_std": 2.7608, "Agent": "SAC"}, {"env_step": 420000, "rew": 9357.865, "rew_std": 2.1883, "Agent": "SAC"}, {"env_step": 425000, "rew": 9356.5476, "rew_std": 4.8174, "Agent": "SAC"}, {"env_step": 430000, "rew": 9358.2478, "rew_std": 2.0621, "Agent": "SAC"}, {"env_step": 435000, "rew": 9357.224, "rew_std": 3.8015, "Agent": "SAC"}, {"env_step": 440000, "rew": 9357.3562, "rew_std": 3.3264, "Agent": "SAC"}, {"env_step": 445000, "rew": 9358.0301, "rew_std": 1.9789, "Agent": "SAC"}, {"env_step": 450000, "rew": 9358.1439, "rew_std": 1.3295, "Agent": "SAC"}, {"env_step": 455000, "rew": 9357.0635, "rew_std": 2.7428, "Agent": "SAC"}, {"env_step": 460000, "rew": 9358.3828, "rew_std": 2.1765, "Agent": "SAC"}, {"env_step": 465000, "rew": 9358.1382, "rew_std": 1.4252, "Agent": "SAC"}, {"env_step": 470000, "rew": 9182.7382, "rew_std": 521.5833, "Agent": "SAC"}, {"env_step": 475000, "rew": 8551.3778, "rew_std": 2412.8404, "Agent": "SAC"}, {"env_step": 480000, "rew": 9357.468, "rew_std": 2.7522, "Agent": "SAC"}, {"env_step": 485000, "rew": 9357.9983, "rew_std": 1.7244, "Agent": "SAC"}, {"env_step": 490000, "rew": 8534.6716, "rew_std": 2470.8785, "Agent": "SAC"}, {"env_step": 495000, "rew": 8514.5436, "rew_std": 2528.1433, "Agent": "SAC"}, {"env_step": 500000, "rew": 9296.5499, "rew_std": 183.7219, "Agent": "SAC"}, {"env_step": 505000, "rew": 9357.6859, "rew_std": 1.5885, "Agent": "SAC"}, {"env_step": 510000, "rew": 7917.2816, "rew_std": 2901.6283, "Agent": "SAC"}, {"env_step": 515000, "rew": 9355.8243, "rew_std": 2.8363, "Agent": "SAC"}, {"env_step": 520000, "rew": 8639.4952, "rew_std": 2154.2267, "Agent": "SAC"}, {"env_step": 525000, "rew": 9357.7612, "rew_std": 1.9323, "Agent": "SAC"}, {"env_step": 530000, "rew": 9357.5089, "rew_std": 2.2904, "Agent": "SAC"}, {"env_step": 535000, "rew": 8953.6934, "rew_std": 1213.18, "Agent": "SAC"}, {"env_step": 540000, "rew": 9357.9182, "rew_std": 2.6973, "Agent": "SAC"}, {"env_step": 545000, "rew": 9358.0829, "rew_std": 2.6316, "Agent": "SAC"}, {"env_step": 550000, "rew": 9358.3228, "rew_std": 1.9631, "Agent": "SAC"}, {"env_step": 555000, "rew": 9358.631, "rew_std": 1.5429, "Agent": "SAC"}, {"env_step": 560000, "rew": 9357.9939, "rew_std": 2.6106, "Agent": "SAC"}, {"env_step": 565000, "rew": 9357.863, "rew_std": 2.1863, "Agent": "SAC"}, {"env_step": 570000, "rew": 9269.8532, "rew_std": 264.2835, "Agent": "SAC"}, {"env_step": 575000, "rew": 8532.672, "rew_std": 2478.1488, "Agent": "SAC"}, {"env_step": 580000, "rew": 9268.4563, "rew_std": 269.2364, "Agent": "SAC"}, {"env_step": 585000, "rew": 9356.9148, "rew_std": 2.7939, "Agent": "SAC"}, {"env_step": 590000, "rew": 9357.5543, "rew_std": 3.2443, "Agent": "SAC"}, {"env_step": 595000, "rew": 9357.463, "rew_std": 4.0439, "Agent": "SAC"}, {"env_step": 600000, "rew": 9358.4626, "rew_std": 1.9303, "Agent": "SAC"}, {"env_step": 605000, "rew": 9358.3671, "rew_std": 1.6862, "Agent": "SAC"}, {"env_step": 610000, "rew": 9356.2164, "rew_std": 3.1168, "Agent": "SAC"}, {"env_step": 615000, "rew": 9196.5389, "rew_std": 479.0729, "Agent": "SAC"}, {"env_step": 620000, "rew": 9356.9592, "rew_std": 3.5518, "Agent": "SAC"}, {"env_step": 625000, "rew": 9357.161, "rew_std": 2.5809, "Agent": "SAC"}, {"env_step": 630000, "rew": 9357.3341, "rew_std": 3.0693, "Agent": "SAC"}, {"env_step": 635000, "rew": 9356.3924, "rew_std": 4.6242, "Agent": "SAC"}, {"env_step": 640000, "rew": 9358.5012, "rew_std": 1.1927, "Agent": "SAC"}, {"env_step": 645000, "rew": 9354.8708, "rew_std": 8.4384, "Agent": "SAC"}, {"env_step": 650000, "rew": 9356.4388, "rew_std": 4.5926, "Agent": "SAC"}, {"env_step": 655000, "rew": 9268.8286, "rew_std": 268.5847, "Agent": "SAC"}, {"env_step": 660000, "rew": 9358.5155, "rew_std": 0.8397, "Agent": "SAC"}, {"env_step": 665000, "rew": 9356.109, "rew_std": 4.5035, "Agent": "SAC"}, {"env_step": 670000, "rew": 8668.209, "rew_std": 2067.7502, "Agent": "SAC"}, {"env_step": 675000, "rew": 9356.4476, "rew_std": 2.7218, "Agent": "SAC"}, {"env_step": 680000, "rew": 9356.7041, "rew_std": 2.8959, "Agent": "SAC"}, {"env_step": 685000, "rew": 9183.2542, "rew_std": 507.7661, "Agent": "SAC"}, {"env_step": 690000, "rew": 9185.6077, "rew_std": 512.599, "Agent": "SAC"}, {"env_step": 695000, "rew": 9353.9835, "rew_std": 5.7664, "Agent": "SAC"}, {"env_step": 700000, "rew": 9356.6336, "rew_std": 2.2203, "Agent": "SAC"}, {"env_step": 705000, "rew": 9356.3002, "rew_std": 1.8897, "Agent": "SAC"}, {"env_step": 710000, "rew": 9358.1446, "rew_std": 1.2315, "Agent": "SAC"}, {"env_step": 715000, "rew": 9356.4302, "rew_std": 5.0337, "Agent": "SAC"}, {"env_step": 720000, "rew": 9357.4375, "rew_std": 2.3157, "Agent": "SAC"}, {"env_step": 725000, "rew": 9357.2368, "rew_std": 2.2183, "Agent": "SAC"}, {"env_step": 730000, "rew": 9358.8531, "rew_std": 0.8592, "Agent": "SAC"}, {"env_step": 735000, "rew": 9356.496, "rew_std": 4.2008, "Agent": "SAC"}, {"env_step": 740000, "rew": 9358.0214, "rew_std": 1.9654, "Agent": "SAC"}, {"env_step": 745000, "rew": 9185.1656, "rew_std": 514.708, "Agent": "SAC"}, {"env_step": 750000, "rew": 9357.9964, "rew_std": 1.2584, "Agent": "SAC"}, {"env_step": 755000, "rew": 9185.0382, "rew_std": 512.9892, "Agent": "SAC"}, {"env_step": 760000, "rew": 9355.9867, "rew_std": 4.5162, "Agent": "SAC"}, {"env_step": 765000, "rew": 9357.3264, "rew_std": 2.0687, "Agent": "SAC"}, {"env_step": 770000, "rew": 9358.5004, "rew_std": 1.0138, "Agent": "SAC"}, {"env_step": 775000, "rew": 9268.6565, "rew_std": 255.2189, "Agent": "SAC"}, {"env_step": 780000, "rew": 9358.1214, "rew_std": 1.6113, "Agent": "SAC"}, {"env_step": 785000, "rew": 9356.2192, "rew_std": 3.7295, "Agent": "SAC"}, {"env_step": 790000, "rew": 9356.6503, "rew_std": 3.8859, "Agent": "SAC"}, {"env_step": 795000, "rew": 9357.0889, "rew_std": 3.9538, "Agent": "SAC"}, {"env_step": 800000, "rew": 9357.3384, "rew_std": 1.7422, "Agent": "SAC"}, {"env_step": 805000, "rew": 9356.6001, "rew_std": 2.6288, "Agent": "SAC"}, {"env_step": 810000, "rew": 9355.0373, "rew_std": 4.3317, "Agent": "SAC"}, {"env_step": 815000, "rew": 9272.1791, "rew_std": 244.7629, "Agent": "SAC"}, {"env_step": 820000, "rew": 8584.3171, "rew_std": 2312.6697, "Agent": "SAC"}, {"env_step": 825000, "rew": 9355.9172, "rew_std": 3.118, "Agent": "SAC"}, {"env_step": 830000, "rew": 9355.178, "rew_std": 4.1283, "Agent": "SAC"}, {"env_step": 835000, "rew": 9354.8275, "rew_std": 3.0273, "Agent": "SAC"}, {"env_step": 840000, "rew": 9356.123, "rew_std": 2.7092, "Agent": "SAC"}, {"env_step": 845000, "rew": 9356.9006, "rew_std": 2.6423, "Agent": "SAC"}, {"env_step": 850000, "rew": 9097.4006, "rew_std": 776.0303, "Agent": "SAC"}, {"env_step": 855000, "rew": 9188.9318, "rew_std": 499.1948, "Agent": "SAC"}, {"env_step": 860000, "rew": 9357.2354, "rew_std": 2.9334, "Agent": "SAC"}, {"env_step": 865000, "rew": 9355.8375, "rew_std": 4.2123, "Agent": "SAC"}, {"env_step": 870000, "rew": 9353.5733, "rew_std": 9.3714, "Agent": "SAC"}, {"env_step": 875000, "rew": 9357.4238, "rew_std": 2.3234, "Agent": "SAC"}, {"env_step": 880000, "rew": 9356.2627, "rew_std": 6.0144, "Agent": "SAC"}, {"env_step": 885000, "rew": 9357.9774, "rew_std": 2.1263, "Agent": "SAC"}, {"env_step": 890000, "rew": 9357.6414, "rew_std": 1.6319, "Agent": "SAC"}, {"env_step": 895000, "rew": 9357.9668, "rew_std": 1.9952, "Agent": "SAC"}, {"env_step": 900000, "rew": 8471.5008, "rew_std": 2378.4696, "Agent": "SAC"}, {"env_step": 905000, "rew": 9356.7069, "rew_std": 3.7738, "Agent": "SAC"}, {"env_step": 910000, "rew": 9357.1332, "rew_std": 3.5212, "Agent": "SAC"}, {"env_step": 915000, "rew": 9355.6515, "rew_std": 4.1753, "Agent": "SAC"}, {"env_step": 920000, "rew": 9353.0939, "rew_std": 4.6991, "Agent": "SAC"}, {"env_step": 925000, "rew": 8509.6734, "rew_std": 2544.1191, "Agent": "SAC"}, {"env_step": 930000, "rew": 9356.5265, "rew_std": 3.1623, "Agent": "SAC"}, {"env_step": 935000, "rew": 9356.4495, "rew_std": 2.4185, "Agent": "SAC"}, {"env_step": 940000, "rew": 9356.1637, "rew_std": 3.4761, "Agent": "SAC"}, {"env_step": 945000, "rew": 8557.7586, "rew_std": 2391.4699, "Agent": "SAC"}, {"env_step": 950000, "rew": 9355.9067, "rew_std": 3.3597, "Agent": "SAC"}, {"env_step": 955000, "rew": 9355.8109, "rew_std": 2.0901, "Agent": "SAC"}, {"env_step": 960000, "rew": 9356.5445, "rew_std": 2.6151, "Agent": "SAC"}, {"env_step": 965000, "rew": 9356.6557, "rew_std": 3.2263, "Agent": "SAC"}, {"env_step": 970000, "rew": 9356.6071, "rew_std": 3.243, "Agent": "SAC"}, {"env_step": 975000, "rew": 9355.9793, "rew_std": 3.4355, "Agent": "SAC"}, {"env_step": 980000, "rew": 8523.7853, "rew_std": 2496.1878, "Agent": "SAC"}, {"env_step": 985000, "rew": 9354.4498, "rew_std": 4.182, "Agent": "SAC"}, {"env_step": 990000, "rew": 9357.3811, "rew_std": 1.9945, "Agent": "SAC"}, {"env_step": 995000, "rew": 9357.1444, "rew_std": 1.9249, "Agent": "SAC"}, {"env_step": 1000000, "rew": 9269.378, "rew_std": 265.5736, "Agent": "SAC"}, {"env_step": 1005000, "rew": 9355.054, "rew_std": 5.6732, "Agent": "SAC"}, {"env_step": 1010000, "rew": 8485.4707, "rew_std": 2610.2802, "Agent": "SAC"}, {"env_step": 1015000, "rew": 9355.2511, "rew_std": 3.5887, "Agent": "SAC"}, {"env_step": 1020000, "rew": 9357.6654, "rew_std": 2.0783, "Agent": "SAC"}, {"env_step": 1025000, "rew": 8824.9238, "rew_std": 1321.7067, "Agent": "SAC"}, {"env_step": 1030000, "rew": 9354.8854, "rew_std": 8.5901, "Agent": "SAC"}, {"env_step": 1035000, "rew": 8748.8442, "rew_std": 1823.8367, "Agent": "SAC"}, {"env_step": 1040000, "rew": 9355.839, "rew_std": 3.0407, "Agent": "SAC"}, {"env_step": 1045000, "rew": 9186.054, "rew_std": 498.5165, "Agent": "SAC"}, {"env_step": 1050000, "rew": 9355.953, "rew_std": 4.6684, "Agent": "SAC"}, {"env_step": 1055000, "rew": 8556.4775, "rew_std": 2402.5939, "Agent": "SAC"}, {"env_step": 1060000, "rew": 7979.0473, "rew_std": 2758.1903, "Agent": "SAC"}, {"env_step": 1065000, "rew": 9357.7278, "rew_std": 1.6492, "Agent": "SAC"}, {"env_step": 1070000, "rew": 9357.3245, "rew_std": 1.9565, "Agent": "SAC"}, {"env_step": 1075000, "rew": 9355.7818, "rew_std": 5.2267, "Agent": "SAC"}, {"env_step": 1080000, "rew": 8654.1202, "rew_std": 2108.016, "Agent": "SAC"}, {"env_step": 1085000, "rew": 9264.301, "rew_std": 280.1512, "Agent": "SAC"}, {"env_step": 1090000, "rew": 8669.3311, "rew_std": 1414.0249, "Agent": "SAC"}, {"env_step": 1095000, "rew": 9357.4627, "rew_std": 2.0457, "Agent": "SAC"}, {"env_step": 1100000, "rew": 9356.6594, "rew_std": 2.7395, "Agent": "SAC"}, {"env_step": 1105000, "rew": 9267.9669, "rew_std": 265.7297, "Agent": "SAC"}, {"env_step": 1110000, "rew": 9356.5423, "rew_std": 2.5126, "Agent": "SAC"}, {"env_step": 1115000, "rew": 8597.87, "rew_std": 2277.7467, "Agent": "SAC"}, {"env_step": 1120000, "rew": 9264.0892, "rew_std": 276.7349, "Agent": "SAC"}, {"env_step": 1125000, "rew": 7900.357, "rew_std": 2951.27, "Agent": "SAC"}, {"env_step": 1130000, "rew": 9354.4699, "rew_std": 6.3684, "Agent": "SAC"}, {"env_step": 1135000, "rew": 9356.0906, "rew_std": 4.4826, "Agent": "SAC"}, {"env_step": 1140000, "rew": 9354.2508, "rew_std": 6.1105, "Agent": "SAC"}, {"env_step": 1145000, "rew": 9356.163, "rew_std": 3.1381, "Agent": "SAC"}, {"env_step": 1150000, "rew": 9354.3438, "rew_std": 4.3484, "Agent": "SAC"}, {"env_step": 1155000, "rew": 9353.4378, "rew_std": 6.3306, "Agent": "SAC"}, {"env_step": 1160000, "rew": 9356.8536, "rew_std": 3.0736, "Agent": "SAC"}, {"env_step": 1165000, "rew": 9356.9584, "rew_std": 2.9037, "Agent": "SAC"}, {"env_step": 1170000, "rew": 9263.6426, "rew_std": 279.4552, "Agent": "SAC"}, {"env_step": 1175000, "rew": 9356.6183, "rew_std": 3.1622, "Agent": "SAC"}, {"env_step": 1180000, "rew": 9261.2321, "rew_std": 273.7961, "Agent": "SAC"}, {"env_step": 1185000, "rew": 9355.9645, "rew_std": 3.8095, "Agent": "SAC"}, {"env_step": 1190000, "rew": 9356.537, "rew_std": 2.3578, "Agent": "SAC"}, {"env_step": 1195000, "rew": 9357.0243, "rew_std": 2.3114, "Agent": "SAC"}, {"env_step": 1200000, "rew": 9007.6879, "rew_std": 1041.6742, "Agent": "SAC"}, {"env_step": 1205000, "rew": 9356.6688, "rew_std": 2.3098, "Agent": "SAC"}, {"env_step": 1210000, "rew": 9357.0209, "rew_std": 2.1465, "Agent": "SAC"}, {"env_step": 1215000, "rew": 9356.3172, "rew_std": 2.1724, "Agent": "SAC"}, {"env_step": 1220000, "rew": 9355.0894, "rew_std": 4.8487, "Agent": "SAC"}, {"env_step": 1225000, "rew": 9355.2638, "rew_std": 2.3195, "Agent": "SAC"}, {"env_step": 1230000, "rew": 9355.6464, "rew_std": 2.4159, "Agent": "SAC"}, {"env_step": 1235000, "rew": 9353.5888, "rew_std": 7.0113, "Agent": "SAC"}, {"env_step": 1240000, "rew": 9355.6813, "rew_std": 2.9253, "Agent": "SAC"}, {"env_step": 1245000, "rew": 9356.5849, "rew_std": 2.2778, "Agent": "SAC"}, {"env_step": 1250000, "rew": 9352.2148, "rew_std": 12.6716, "Agent": "SAC"}, {"env_step": 0, "rew": 53.5626, "rew_std": 5.4712, "Agent": "TRPO"}, {"env_step": 30720, "rew": 261.8917, "rew_std": 53.4098, "Agent": "TRPO"}, {"env_step": 61440, "rew": 556.3956, "rew_std": 163.1329, "Agent": "TRPO"}, {"env_step": 92160, "rew": 6024.5962, "rew_std": 2626.8481, "Agent": "TRPO"}, {"env_step": 122880, "rew": 8435.1516, "rew_std": 1073.3378, "Agent": "TRPO"}, {"env_step": 153600, "rew": 6321.6404, "rew_std": 1654.5351, "Agent": "TRPO"}, {"env_step": 184320, "rew": 5460.3046, "rew_std": 2159.549, "Agent": "TRPO"}, {"env_step": 215040, "rew": 5552.8667, "rew_std": 1645.6569, "Agent": "TRPO"}, {"env_step": 245760, "rew": 6117.8932, "rew_std": 1161.243, "Agent": "TRPO"}, {"env_step": 276480, "rew": 6140.454, "rew_std": 1274.2871, "Agent": "TRPO"}, {"env_step": 307200, "rew": 5604.0893, "rew_std": 2094.1793, "Agent": "TRPO"}, {"env_step": 337920, "rew": 4733.8243, "rew_std": 2455.4449, "Agent": "TRPO"}, {"env_step": 368640, "rew": 3576.1349, "rew_std": 2420.6042, "Agent": "TRPO"}, {"env_step": 399360, "rew": 4234.4622, "rew_std": 3054.4371, "Agent": "TRPO"}, {"env_step": 430080, "rew": 3721.2604, "rew_std": 2587.9909, "Agent": "TRPO"}, {"env_step": 460800, "rew": 4253.3959, "rew_std": 2831.927, "Agent": "TRPO"}, {"env_step": 491520, "rew": 3000.9859, "rew_std": 2305.565, "Agent": "TRPO"}, {"env_step": 522240, "rew": 3774.1206, "rew_std": 2412.0237, "Agent": "TRPO"}, {"env_step": 552960, "rew": 2637.774, "rew_std": 2438.7809, "Agent": "TRPO"}, {"env_step": 583680, "rew": 2761.7871, "rew_std": 1571.5899, "Agent": "TRPO"}, {"env_step": 614400, "rew": 2591.357, "rew_std": 1853.4057, "Agent": "TRPO"}, {"env_step": 645120, "rew": 3162.8687, "rew_std": 1679.7828, "Agent": "TRPO"}, {"env_step": 675840, "rew": 2713.4127, "rew_std": 2049.1118, "Agent": "TRPO"}, {"env_step": 706560, "rew": 2588.5211, "rew_std": 1598.6496, "Agent": "TRPO"}, {"env_step": 737280, "rew": 3127.6383, "rew_std": 1722.3851, "Agent": "TRPO"}, {"env_step": 768000, "rew": 3505.0184, "rew_std": 2232.7699, "Agent": "TRPO"}, {"env_step": 798720, "rew": 3437.8395, "rew_std": 2674.9589, "Agent": "TRPO"}, {"env_step": 829440, "rew": 2834.3988, "rew_std": 1487.5097, "Agent": "TRPO"}, {"env_step": 860160, "rew": 2889.5119, "rew_std": 2444.8602, "Agent": "TRPO"}, {"env_step": 890880, "rew": 3927.5854, "rew_std": 2049.2697, "Agent": "TRPO"}, {"env_step": 921600, "rew": 2907.2243, "rew_std": 2122.1556, "Agent": "TRPO"}, {"env_step": 952320, "rew": 3410.9617, "rew_std": 2333.8635, "Agent": "TRPO"}, {"env_step": 983040, "rew": 2742.4646, "rew_std": 2240.2084, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 2313.7183, "rew_std": 2073.7954, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 2152.3924, "rew_std": 860.2705, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 2875.9442, "rew_std": 1712.2911, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 987.9845, "rew_std": 881.0233, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 2505.9952, "rew_std": 1564.8081, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 3046.9737, "rew_std": 2256.3131, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 3405.6145, "rew_std": 1579.8816, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 1778.4643, "rew_std": 1329.6039, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 1571.6279, "rew_std": 1358.0218, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 2069.9224, "rew_std": 1186.9045, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 2223.4399, "rew_std": 1158.24, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 1597.1536, "rew_std": 902.1674, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 2049.2875, "rew_std": 1215.2393, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 3720.0218, "rew_std": 894.6003, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 3439.859, "rew_std": 2177.9695, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 2751.9302, "rew_std": 1530.0513, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 2201.9053, "rew_std": 1397.6169, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 1284.0257, "rew_std": 1218.4937, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 4271.5546, "rew_std": 2116.253, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 2560.8802, "rew_std": 1718.6728, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 2646.396, "rew_std": 1531.2576, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 1555.8823, "rew_std": 1169.7554, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 2085.4617, "rew_std": 1519.8495, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 2346.8782, "rew_std": 1323.4839, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 2195.8408, "rew_std": 1078.8864, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 2095.8517, "rew_std": 1070.0273, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 2088.1241, "rew_std": 1393.2947, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 2321.9152, "rew_std": 1579.2272, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 3050.874, "rew_std": 1769.7151, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 2952.0594, "rew_std": 1769.1773, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 2151.7718, "rew_std": 1678.553, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 2577.0553, "rew_std": 1429.7604, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 2033.6806, "rew_std": 1427.4249, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 2678.165, "rew_std": 1789.9722, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 2436.1723, "rew_std": 1725.1597, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 2589.1848, "rew_std": 1676.7095, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 1924.3706, "rew_std": 1328.473, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 2588.5063, "rew_std": 1565.9773, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 2281.369, "rew_std": 1253.5793, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 2493.7936, "rew_std": 1868.2228, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 2026.7874, "rew_std": 1468.7833, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 3319.2301, "rew_std": 2009.4682, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 3713.9449, "rew_std": 2097.9346, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 2857.8177, "rew_std": 1915.6668, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 2870.1954, "rew_std": 1993.1097, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 2998.2679, "rew_std": 1826.9552, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 2911.0523, "rew_std": 1918.5489, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 3641.3796, "rew_std": 1991.3939, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 3153.6067, "rew_std": 1782.7791, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 1456.1088, "rew_std": 942.0327, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 3186.4096, "rew_std": 1418.0592, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 3450.7127, "rew_std": 1243.4847, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 2867.9201, "rew_std": 2317.2895, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 2847.1381, "rew_std": 1339.6926, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 2974.4306, "rew_std": 2499.9414, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 2589.186, "rew_std": 1652.6024, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 2606.2226, "rew_std": 1475.1118, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 2864.1705, "rew_std": 1756.7181, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 3498.5409, "rew_std": 2120.5779, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 3308.2452, "rew_std": 1399.7237, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 1879.7321, "rew_std": 1821.4177, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 2450.376, "rew_std": 1911.9973, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 2601.444, "rew_std": 1516.2042, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 2404.9808, "rew_std": 1693.6965, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 2597.6516, "rew_std": 1893.7043, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 4318.039, "rew_std": 2129.4765, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 3861.5413, "rew_std": 2370.5409, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 3990.0621, "rew_std": 2349.5233, "Agent": "TRPO"}, {"env_step": 0, "rew": 53.5626, "rew_std": 5.4712, "Agent": "A2C"}, {"env_step": 30000, "rew": 165.3699, "rew_std": 15.8262, "Agent": "A2C"}, {"env_step": 60000, "rew": 278.5414, "rew_std": 35.5195, "Agent": "A2C"}, {"env_step": 90000, "rew": 370.5591, "rew_std": 64.1232, "Agent": "A2C"}, {"env_step": 120000, "rew": 515.2061, "rew_std": 76.4682, "Agent": "A2C"}, {"env_step": 150000, "rew": 705.1444, "rew_std": 92.1359, "Agent": "A2C"}, {"env_step": 180000, "rew": 1125.0754, "rew_std": 350.0867, "Agent": "A2C"}, {"env_step": 210000, "rew": 3093.8255, "rew_std": 1674.9932, "Agent": "A2C"}, {"env_step": 240000, "rew": 6080.3757, "rew_std": 1434.3889, "Agent": "A2C"}, {"env_step": 270000, "rew": 6683.2966, "rew_std": 1128.3915, "Agent": "A2C"}, {"env_step": 300000, "rew": 7589.9427, "rew_std": 849.6975, "Agent": "A2C"}, {"env_step": 330000, "rew": 5696.9149, "rew_std": 2277.6442, "Agent": "A2C"}, {"env_step": 360000, "rew": 5649.5662, "rew_std": 1297.3898, "Agent": "A2C"}, {"env_step": 390000, "rew": 7372.0974, "rew_std": 2547.9211, "Agent": "A2C"}, {"env_step": 420000, "rew": 6570.9616, "rew_std": 1163.1758, "Agent": "A2C"}, {"env_step": 450000, "rew": 6874.2586, "rew_std": 1602.3641, "Agent": "A2C"}, {"env_step": 480000, "rew": 7311.5666, "rew_std": 999.7631, "Agent": "A2C"}, {"env_step": 510000, "rew": 7592.0021, "rew_std": 1130.0516, "Agent": "A2C"}, {"env_step": 540000, "rew": 7053.2387, "rew_std": 1230.277, "Agent": "A2C"}, {"env_step": 570000, "rew": 8249.9909, "rew_std": 1725.9754, "Agent": "A2C"}, {"env_step": 600000, "rew": 6397.1525, "rew_std": 1793.332, "Agent": "A2C"}, {"env_step": 630000, "rew": 7227.102, "rew_std": 1103.6105, "Agent": "A2C"}, {"env_step": 660000, "rew": 7133.5374, "rew_std": 1445.3755, "Agent": "A2C"}, {"env_step": 690000, "rew": 7732.3018, "rew_std": 1844.5892, "Agent": "A2C"}, {"env_step": 720000, "rew": 8703.7419, "rew_std": 834.3039, "Agent": "A2C"}, {"env_step": 750000, "rew": 8633.7331, "rew_std": 1107.9686, "Agent": "A2C"}, {"env_step": 780000, "rew": 8274.7136, "rew_std": 2053.5267, "Agent": "A2C"}, {"env_step": 810000, "rew": 7322.6685, "rew_std": 1656.3385, "Agent": "A2C"}, {"env_step": 840000, "rew": 7923.2505, "rew_std": 2314.1175, "Agent": "A2C"}, {"env_step": 870000, "rew": 7855.25, "rew_std": 2656.8457, "Agent": "A2C"}, {"env_step": 900000, "rew": 8149.0521, "rew_std": 1381.1895, "Agent": "A2C"}, {"env_step": 930000, "rew": 7485.3729, "rew_std": 3531.042, "Agent": "A2C"}, {"env_step": 960000, "rew": 9257.6636, "rew_std": 277.4383, "Agent": "A2C"}, {"env_step": 990000, "rew": 8989.5551, "rew_std": 604.5116, "Agent": "A2C"}, {"env_step": 1020000, "rew": 8710.0884, "rew_std": 717.8418, "Agent": "A2C"}, {"env_step": 1050000, "rew": 7964.6811, "rew_std": 2670.7761, "Agent": "A2C"}, {"env_step": 1080000, "rew": 8139.1856, "rew_std": 2183.9688, "Agent": "A2C"}, {"env_step": 1110000, "rew": 7763.4722, "rew_std": 2407.9368, "Agent": "A2C"}, {"env_step": 1140000, "rew": 7343.0162, "rew_std": 3320.6158, "Agent": "A2C"}, {"env_step": 1170000, "rew": 7926.8729, "rew_std": 2558.491, "Agent": "A2C"}, {"env_step": 1200000, "rew": 9074.6163, "rew_std": 591.3742, "Agent": "A2C"}, {"env_step": 1230000, "rew": 8704.4275, "rew_std": 832.6564, "Agent": "A2C"}, {"env_step": 1260000, "rew": 8379.228, "rew_std": 2616.9612, "Agent": "A2C"}, {"env_step": 1290000, "rew": 7995.9326, "rew_std": 2099.1052, "Agent": "A2C"}, {"env_step": 1320000, "rew": 8597.2945, "rew_std": 934.2636, "Agent": "A2C"}, {"env_step": 1350000, "rew": 9043.1429, "rew_std": 677.0861, "Agent": "A2C"}, {"env_step": 1380000, "rew": 9350.4301, "rew_std": 12.0039, "Agent": "A2C"}, {"env_step": 1410000, "rew": 8298.0241, "rew_std": 1903.4005, "Agent": "A2C"}, {"env_step": 1440000, "rew": 8109.2874, "rew_std": 2016.9284, "Agent": "A2C"}, {"env_step": 1470000, "rew": 8642.3605, "rew_std": 1534.7333, "Agent": "A2C"}, {"env_step": 1500000, "rew": 8981.4328, "rew_std": 607.3778, "Agent": "A2C"}, {"env_step": 1530000, "rew": 7579.4363, "rew_std": 3559.5222, "Agent": "A2C"}, {"env_step": 1560000, "rew": 6014.9854, "rew_std": 3158.7687, "Agent": "A2C"}, {"env_step": 1590000, "rew": 8436.0225, "rew_std": 911.7899, "Agent": "A2C"}, {"env_step": 1620000, "rew": 7240.4051, "rew_std": 2977.2566, "Agent": "A2C"}, {"env_step": 1650000, "rew": 7376.5496, "rew_std": 3101.1354, "Agent": "A2C"}, {"env_step": 1680000, "rew": 6505.8345, "rew_std": 3945.7676, "Agent": "A2C"}, {"env_step": 1710000, "rew": 8214.8968, "rew_std": 2053.7879, "Agent": "A2C"}, {"env_step": 1740000, "rew": 8406.5618, "rew_std": 1766.4248, "Agent": "A2C"}, {"env_step": 1770000, "rew": 8609.5837, "rew_std": 1270.4979, "Agent": "A2C"}, {"env_step": 1800000, "rew": 9170.2991, "rew_std": 525.8975, "Agent": "A2C"}, {"env_step": 1830000, "rew": 9347.1827, "rew_std": 13.3392, "Agent": "A2C"}, {"env_step": 1860000, "rew": 8803.5903, "rew_std": 918.7437, "Agent": "A2C"}, {"env_step": 1890000, "rew": 9161.4353, "rew_std": 374.3905, "Agent": "A2C"}, {"env_step": 1920000, "rew": 9348.3455, "rew_std": 12.6689, "Agent": "A2C"}, {"env_step": 1950000, "rew": 9176.7473, "rew_std": 543.232, "Agent": "A2C"}, {"env_step": 1980000, "rew": 7453.3149, "rew_std": 3360.1904, "Agent": "A2C"}, {"env_step": 2010000, "rew": 9351.3157, "rew_std": 12.7785, "Agent": "A2C"}, {"env_step": 2040000, "rew": 8813.3769, "rew_std": 1075.499, "Agent": "A2C"}, {"env_step": 2070000, "rew": 9077.6345, "rew_std": 816.8358, "Agent": "A2C"}, {"env_step": 2100000, "rew": 8904.5094, "rew_std": 716.6057, "Agent": "A2C"}, {"env_step": 2130000, "rew": 8614.7209, "rew_std": 1345.6491, "Agent": "A2C"}, {"env_step": 2160000, "rew": 8171.675, "rew_std": 2683.0986, "Agent": "A2C"}, {"env_step": 2190000, "rew": 7869.7354, "rew_std": 2363.8685, "Agent": "A2C"}, {"env_step": 2220000, "rew": 8819.4359, "rew_std": 596.9582, "Agent": "A2C"}, {"env_step": 2250000, "rew": 8387.8828, "rew_std": 2584.99, "Agent": "A2C"}, {"env_step": 2280000, "rew": 7908.1091, "rew_std": 1331.1717, "Agent": "A2C"}, {"env_step": 2310000, "rew": 8712.9974, "rew_std": 718.7488, "Agent": "A2C"}, {"env_step": 2340000, "rew": 8893.5525, "rew_std": 621.7979, "Agent": "A2C"}, {"env_step": 2370000, "rew": 7149.2746, "rew_std": 3312.735, "Agent": "A2C"}, {"env_step": 2400000, "rew": 8279.6943, "rew_std": 2617.049, "Agent": "A2C"}, {"env_step": 2430000, "rew": 9347.9399, "rew_std": 12.6763, "Agent": "A2C"}, {"env_step": 2460000, "rew": 8618.9958, "rew_std": 1134.2173, "Agent": "A2C"}, {"env_step": 2490000, "rew": 9167.1785, "rew_std": 555.3044, "Agent": "A2C"}, {"env_step": 2520000, "rew": 9112.2709, "rew_std": 722.9989, "Agent": "A2C"}, {"env_step": 2550000, "rew": 9346.3538, "rew_std": 14.2909, "Agent": "A2C"}, {"env_step": 2580000, "rew": 9261.4516, "rew_std": 260.8552, "Agent": "A2C"}, {"env_step": 2610000, "rew": 8807.666, "rew_std": 819.9374, "Agent": "A2C"}, {"env_step": 2640000, "rew": 8299.3944, "rew_std": 2555.8638, "Agent": "A2C"}, {"env_step": 2670000, "rew": 7549.846, "rew_std": 3158.768, "Agent": "A2C"}, {"env_step": 2700000, "rew": 8893.9045, "rew_std": 608.1252, "Agent": "A2C"}, {"env_step": 2730000, "rew": 8581.0372, "rew_std": 942.1541, "Agent": "A2C"}, {"env_step": 2760000, "rew": 8160.1186, "rew_std": 2406.8291, "Agent": "A2C"}, {"env_step": 2790000, "rew": 8313.3783, "rew_std": 2274.0883, "Agent": "A2C"}, {"env_step": 2820000, "rew": 8888.0056, "rew_std": 619.69, "Agent": "A2C"}, {"env_step": 2850000, "rew": 8804.6519, "rew_std": 1080.8811, "Agent": "A2C"}, {"env_step": 2880000, "rew": 9142.4464, "rew_std": 356.4098, "Agent": "A2C"}, {"env_step": 2910000, "rew": 8983.9959, "rew_std": 601.4488, "Agent": "A2C"}, {"env_step": 2940000, "rew": 9080.3266, "rew_std": 407.971, "Agent": "A2C"}, {"env_step": 2970000, "rew": 9349.8121, "rew_std": 7.0154, "Agent": "A2C"}, {"env_step": 3000000, "rew": 9081.4192, "rew_std": 570.8176, "Agent": "A2C"}, {"env_step": 0, "rew": 53.6538, "rew_std": 5.1475, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 205.086, "rew_std": 22.3773, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 242.8813, "rew_std": 37.0494, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 245.5758, "rew_std": 46.3137, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 332.6798, "rew_std": 60.0705, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 346.2826, "rew_std": 68.7464, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 349.2419, "rew_std": 55.9086, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 378.3318, "rew_std": 58.365, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 387.7747, "rew_std": 69.5705, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 425.2122, "rew_std": 115.1994, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 542.3436, "rew_std": 171.4923, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 486.2567, "rew_std": 143.1301, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 483.4774, "rew_std": 119.7832, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 649.8389, "rew_std": 336.8276, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 717.4433, "rew_std": 263.4532, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 808.2998, "rew_std": 434.5571, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 791.4963, "rew_std": 394.4257, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 818.2542, "rew_std": 242.8274, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 1108.6574, "rew_std": 606.2485, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 1053.8726, "rew_std": 421.8714, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 1063.6855, "rew_std": 587.699, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 1366.7775, "rew_std": 813.5606, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 1008.0205, "rew_std": 601.2805, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 1636.1172, "rew_std": 1312.2026, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 1759.9855, "rew_std": 1185.124, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 1115.3884, "rew_std": 498.1863, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 2161.7273, "rew_std": 2405.4617, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 1725.983, "rew_std": 1722.4558, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 2388.3762, "rew_std": 2503.0362, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 2897.3131, "rew_std": 2278.1056, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 2442.9347, "rew_std": 2152.1372, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 1886.8738, "rew_std": 1181.8806, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 1857.7762, "rew_std": 970.2863, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 3073.2792, "rew_std": 1281.6968, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 2672.3475, "rew_std": 2047.1383, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 2833.6576, "rew_std": 2531.4165, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 1993.2629, "rew_std": 853.6519, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 2299.1596, "rew_std": 1017.3348, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 4133.2011, "rew_std": 2351.0559, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 2311.135, "rew_std": 1882.8478, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 2845.4928, "rew_std": 1770.5768, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 3409.5642, "rew_std": 1724.4596, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 2348.9219, "rew_std": 930.9355, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 3024.0624, "rew_std": 1503.2362, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 2266.4518, "rew_std": 508.1994, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 3739.4321, "rew_std": 1604.6673, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 3110.1138, "rew_std": 1450.6002, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 3846.3276, "rew_std": 2973.2934, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 3187.7134, "rew_std": 1522.3903, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 3021.8217, "rew_std": 1571.6426, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 2524.0696, "rew_std": 1708.3912, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 2529.9472, "rew_std": 969.436, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 3399.718, "rew_std": 1931.6749, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 4047.7162, "rew_std": 2245.9658, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 3456.8778, "rew_std": 2183.5483, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 4421.8991, "rew_std": 2383.9312, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 4623.2833, "rew_std": 2737.8343, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 3972.1049, "rew_std": 1092.4037, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 2398.9498, "rew_std": 1561.2595, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 3513.4658, "rew_std": 2250.0689, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 3964.9724, "rew_std": 1645.4332, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 4135.5036, "rew_std": 2267.0778, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 4182.7329, "rew_std": 1622.2163, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 3612.9434, "rew_std": 1928.6272, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 4402.5249, "rew_std": 2400.1818, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 3246.9032, "rew_std": 957.3825, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 2832.1889, "rew_std": 1305.1838, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 2811.1203, "rew_std": 1948.4716, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 3005.8238, "rew_std": 1924.731, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 3502.9994, "rew_std": 1501.19, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 4168.7077, "rew_std": 1234.675, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 3166.7546, "rew_std": 1202.386, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 4223.7409, "rew_std": 1990.0041, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 3349.5737, "rew_std": 1302.2569, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 4644.1612, "rew_std": 2165.3754, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 3660.9681, "rew_std": 1925.8698, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 3262.0164, "rew_std": 1241.993, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 3211.2055, "rew_std": 1886.1509, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 2760.7795, "rew_std": 1643.2487, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 2983.2414, "rew_std": 1440.0369, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 4133.8434, "rew_std": 1977.7667, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 4076.6165, "rew_std": 1812.0822, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 2944.1648, "rew_std": 1454.1681, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 3381.0552, "rew_std": 1625.4565, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 3263.8067, "rew_std": 1529.4285, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 3291.6554, "rew_std": 2194.0305, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 3649.1483, "rew_std": 2426.0624, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 3680.0135, "rew_std": 1714.2302, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 3397.5858, "rew_std": 1568.7918, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 3165.495, "rew_std": 1563.3152, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 3533.9628, "rew_std": 1177.8878, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 3164.9266, "rew_std": 1605.4427, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 3304.0784, "rew_std": 1882.7672, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 2701.0322, "rew_std": 1135.0422, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 3114.4209, "rew_std": 1603.5992, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 3173.9256, "rew_std": 2012.6372, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 3592.0207, "rew_std": 1892.5176, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 3893.495, "rew_std": 1602.7668, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 3520.7811, "rew_std": 1788.4537, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 2868.6874, "rew_std": 1209.5682, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 3181.5864, "rew_std": 1469.3801, "Agent": "ACKTR"}, {"env_step": 0, "rew": 87.8507, "rew_std": 12.8325, "Agent": "DDPG"}, {"env_step": 5000, "rew": 1148.5608, "rew_std": 1411.8006, "Agent": "DDPG"}, {"env_step": 10000, "rew": 5683.871, "rew_std": 3495.3789, "Agent": "DDPG"}, {"env_step": 15000, "rew": 6564.777, "rew_std": 4061.7699, "Agent": "DDPG"}, {"env_step": 20000, "rew": 7379.0819, "rew_std": 3461.198, "Agent": "DDPG"}, {"env_step": 25000, "rew": 8364.3434, "rew_std": 2778.9295, "Agent": "DDPG"}, {"env_step": 30000, "rew": 8363.9272, "rew_std": 2779.0584, "Agent": "DDPG"}, {"env_step": 35000, "rew": 8354.9727, "rew_std": 2775.5436, "Agent": "DDPG"}, {"env_step": 40000, "rew": 8354.2209, "rew_std": 2775.5533, "Agent": "DDPG"}, {"env_step": 45000, "rew": 8353.3548, "rew_std": 2775.2758, "Agent": "DDPG"}, {"env_step": 50000, "rew": 8346.184, "rew_std": 2773.1462, "Agent": "DDPG"}, {"env_step": 55000, "rew": 8340.5262, "rew_std": 2770.9872, "Agent": "DDPG"}, {"env_step": 60000, "rew": 8338.25, "rew_std": 2770.5018, "Agent": "DDPG"}, {"env_step": 65000, "rew": 8336.6722, "rew_std": 2769.444, "Agent": "DDPG"}, {"env_step": 70000, "rew": 8332.4935, "rew_std": 2767.7795, "Agent": "DDPG"}, {"env_step": 75000, "rew": 8327.6732, "rew_std": 2766.4379, "Agent": "DDPG"}, {"env_step": 80000, "rew": 8300.2123, "rew_std": 2758.217, "Agent": "DDPG"}, {"env_step": 85000, "rew": 8321.4129, "rew_std": 2764.0878, "Agent": "DDPG"}, {"env_step": 90000, "rew": 8315.6078, "rew_std": 2762.7047, "Agent": "DDPG"}, {"env_step": 95000, "rew": 8313.166, "rew_std": 2761.6036, "Agent": "DDPG"}, {"env_step": 100000, "rew": 8312.4057, "rew_std": 2761.3488, "Agent": "DDPG"}, {"env_step": 105000, "rew": 8311.4733, "rew_std": 2761.5601, "Agent": "DDPG"}, {"env_step": 110000, "rew": 8307.8776, "rew_std": 2759.8442, "Agent": "DDPG"}, {"env_step": 115000, "rew": 8306.386, "rew_std": 2759.3404, "Agent": "DDPG"}, {"env_step": 120000, "rew": 8301.8255, "rew_std": 2758.0951, "Agent": "DDPG"}, {"env_step": 125000, "rew": 8301.0734, "rew_std": 2757.3022, "Agent": "DDPG"}, {"env_step": 130000, "rew": 8297.8948, "rew_std": 2756.7646, "Agent": "DDPG"}, {"env_step": 135000, "rew": 8300.1575, "rew_std": 2756.711, "Agent": "DDPG"}, {"env_step": 140000, "rew": 8299.4218, "rew_std": 2757.5534, "Agent": "DDPG"}, {"env_step": 145000, "rew": 8298.7566, "rew_std": 2756.7844, "Agent": "DDPG"}, {"env_step": 150000, "rew": 8207.5663, "rew_std": 2740.2049, "Agent": "DDPG"}, {"env_step": 155000, "rew": 8297.8394, "rew_std": 2755.9258, "Agent": "DDPG"}, {"env_step": 160000, "rew": 8296.2179, "rew_std": 2755.9276, "Agent": "DDPG"}, {"env_step": 165000, "rew": 8295.9536, "rew_std": 2756.1112, "Agent": "DDPG"}, {"env_step": 170000, "rew": 8295.9494, "rew_std": 2756.3831, "Agent": "DDPG"}, {"env_step": 175000, "rew": 8293.5577, "rew_std": 2755.3327, "Agent": "DDPG"}, {"env_step": 180000, "rew": 8292.3673, "rew_std": 2754.9256, "Agent": "DDPG"}, {"env_step": 185000, "rew": 8292.4829, "rew_std": 2754.6934, "Agent": "DDPG"}, {"env_step": 190000, "rew": 8292.4845, "rew_std": 2755.2319, "Agent": "DDPG"}, {"env_step": 195000, "rew": 8295.9467, "rew_std": 2755.58, "Agent": "DDPG"}, {"env_step": 200000, "rew": 8293.4849, "rew_std": 2755.315, "Agent": "DDPG"}, {"env_step": 205000, "rew": 8295.1456, "rew_std": 2755.5937, "Agent": "DDPG"}, {"env_step": 210000, "rew": 8292.4386, "rew_std": 2753.8752, "Agent": "DDPG"}, {"env_step": 215000, "rew": 8292.1814, "rew_std": 2754.5895, "Agent": "DDPG"}, {"env_step": 220000, "rew": 8294.0952, "rew_std": 2754.9637, "Agent": "DDPG"}, {"env_step": 225000, "rew": 8294.9958, "rew_std": 2754.735, "Agent": "DDPG"}, {"env_step": 230000, "rew": 8292.6771, "rew_std": 2755.0272, "Agent": "DDPG"}, {"env_step": 235000, "rew": 8290.456, "rew_std": 2754.5529, "Agent": "DDPG"}, {"env_step": 240000, "rew": 8292.1381, "rew_std": 2754.8685, "Agent": "DDPG"}, {"env_step": 245000, "rew": 8291.5933, "rew_std": 2754.1325, "Agent": "DDPG"}, {"env_step": 250000, "rew": 8292.011, "rew_std": 2754.5416, "Agent": "DDPG"}, {"env_step": 255000, "rew": 8293.3528, "rew_std": 2755.5253, "Agent": "DDPG"}, {"env_step": 260000, "rew": 8293.4076, "rew_std": 2754.9993, "Agent": "DDPG"}, {"env_step": 265000, "rew": 8290.5226, "rew_std": 2754.3122, "Agent": "DDPG"}, {"env_step": 270000, "rew": 8293.537, "rew_std": 2755.038, "Agent": "DDPG"}, {"env_step": 275000, "rew": 8289.003, "rew_std": 2753.8052, "Agent": "DDPG"}, {"env_step": 280000, "rew": 8291.2201, "rew_std": 2754.283, "Agent": "DDPG"}, {"env_step": 285000, "rew": 8291.5624, "rew_std": 2754.3976, "Agent": "DDPG"}, {"env_step": 290000, "rew": 8292.1208, "rew_std": 2754.8444, "Agent": "DDPG"}, {"env_step": 295000, "rew": 8292.2593, "rew_std": 2754.084, "Agent": "DDPG"}, {"env_step": 300000, "rew": 8292.862, "rew_std": 2754.8324, "Agent": "DDPG"}, {"env_step": 305000, "rew": 8291.4754, "rew_std": 2753.8274, "Agent": "DDPG"}, {"env_step": 310000, "rew": 8292.0324, "rew_std": 2754.5388, "Agent": "DDPG"}, {"env_step": 315000, "rew": 8291.5211, "rew_std": 2754.1126, "Agent": "DDPG"}, {"env_step": 320000, "rew": 8295.0906, "rew_std": 2755.3129, "Agent": "DDPG"}, {"env_step": 325000, "rew": 8290.7056, "rew_std": 2754.103, "Agent": "DDPG"}, {"env_step": 330000, "rew": 8289.1691, "rew_std": 2753.597, "Agent": "DDPG"}, {"env_step": 335000, "rew": 8291.5639, "rew_std": 2754.6603, "Agent": "DDPG"}, {"env_step": 340000, "rew": 8291.2692, "rew_std": 2754.5552, "Agent": "DDPG"}, {"env_step": 345000, "rew": 8291.326, "rew_std": 2754.592, "Agent": "DDPG"}, {"env_step": 350000, "rew": 8290.4233, "rew_std": 2754.2992, "Agent": "DDPG"}, {"env_step": 355000, "rew": 8288.9633, "rew_std": 2753.7956, "Agent": "DDPG"}, {"env_step": 360000, "rew": 8116.2298, "rew_std": 2746.018, "Agent": "DDPG"}, {"env_step": 365000, "rew": 8292.9889, "rew_std": 2755.1284, "Agent": "DDPG"}, {"env_step": 370000, "rew": 8292.0499, "rew_std": 2754.5696, "Agent": "DDPG"}, {"env_step": 375000, "rew": 8291.2033, "rew_std": 2754.554, "Agent": "DDPG"}, {"env_step": 380000, "rew": 8289.8346, "rew_std": 2754.3545, "Agent": "DDPG"}, {"env_step": 385000, "rew": 8291.7698, "rew_std": 2755.0038, "Agent": "DDPG"}, {"env_step": 390000, "rew": 8292.5342, "rew_std": 2755.2758, "Agent": "DDPG"}, {"env_step": 395000, "rew": 8291.0649, "rew_std": 2754.2264, "Agent": "DDPG"}, {"env_step": 400000, "rew": 8291.7335, "rew_std": 2754.4616, "Agent": "DDPG"}, {"env_step": 405000, "rew": 8292.3161, "rew_std": 2755.182, "Agent": "DDPG"}, {"env_step": 410000, "rew": 8292.905, "rew_std": 2755.1138, "Agent": "DDPG"}, {"env_step": 415000, "rew": 8292.1131, "rew_std": 2754.0447, "Agent": "DDPG"}, {"env_step": 420000, "rew": 8296.2261, "rew_std": 2755.6873, "Agent": "DDPG"}, {"env_step": 425000, "rew": 8292.7841, "rew_std": 2754.7871, "Agent": "DDPG"}, {"env_step": 430000, "rew": 8289.4164, "rew_std": 2754.2258, "Agent": "DDPG"}, {"env_step": 435000, "rew": 8290.0856, "rew_std": 2754.4358, "Agent": "DDPG"}, {"env_step": 440000, "rew": 8291.561, "rew_std": 2754.9278, "Agent": "DDPG"}, {"env_step": 445000, "rew": 8292.6104, "rew_std": 2754.7454, "Agent": "DDPG"}, {"env_step": 450000, "rew": 8293.0174, "rew_std": 2754.603, "Agent": "DDPG"}, {"env_step": 455000, "rew": 8290.9708, "rew_std": 2753.6444, "Agent": "DDPG"}, {"env_step": 460000, "rew": 8297.6342, "rew_std": 2756.4137, "Agent": "DDPG"}, {"env_step": 465000, "rew": 8291.2503, "rew_std": 2754.0156, "Agent": "DDPG"}, {"env_step": 470000, "rew": 8291.3019, "rew_std": 2754.5721, "Agent": "DDPG"}, {"env_step": 475000, "rew": 8292.475, "rew_std": 2755.2348, "Agent": "DDPG"}, {"env_step": 480000, "rew": 8294.4008, "rew_std": 2755.0725, "Agent": "DDPG"}, {"env_step": 485000, "rew": 8291.7367, "rew_std": 2754.7268, "Agent": "DDPG"}, {"env_step": 490000, "rew": 8293.2381, "rew_std": 2755.4898, "Agent": "DDPG"}, {"env_step": 495000, "rew": 8294.7888, "rew_std": 2755.4598, "Agent": "DDPG"}, {"env_step": 500000, "rew": 8296.2677, "rew_std": 2756.2544, "Agent": "DDPG"}, {"env_step": 505000, "rew": 8296.3363, "rew_std": 2756.2511, "Agent": "DDPG"}, {"env_step": 510000, "rew": 8298.5078, "rew_std": 2756.976, "Agent": "DDPG"}, {"env_step": 515000, "rew": 8290.4035, "rew_std": 2753.7381, "Agent": "DDPG"}, {"env_step": 520000, "rew": 8293.848, "rew_std": 2755.4232, "Agent": "DDPG"}, {"env_step": 525000, "rew": 8293.535, "rew_std": 2755.0527, "Agent": "DDPG"}, {"env_step": 530000, "rew": 8293.2774, "rew_std": 2754.9621, "Agent": "DDPG"}, {"env_step": 535000, "rew": 8292.2477, "rew_std": 2754.3555, "Agent": "DDPG"}, {"env_step": 540000, "rew": 8292.3039, "rew_std": 2754.3911, "Agent": "DDPG"}, {"env_step": 545000, "rew": 8292.5461, "rew_std": 2755.2645, "Agent": "DDPG"}, {"env_step": 550000, "rew": 8292.4917, "rew_std": 2754.9733, "Agent": "DDPG"}, {"env_step": 555000, "rew": 8292.9037, "rew_std": 2754.8334, "Agent": "DDPG"}, {"env_step": 560000, "rew": 8294.958, "rew_std": 2755.7869, "Agent": "DDPG"}, {"env_step": 565000, "rew": 8293.528, "rew_std": 2755.0432, "Agent": "DDPG"}, {"env_step": 570000, "rew": 8299.4294, "rew_std": 2757.0191, "Agent": "DDPG"}, {"env_step": 575000, "rew": 8293.6638, "rew_std": 2755.0938, "Agent": "DDPG"}, {"env_step": 580000, "rew": 8291.0625, "rew_std": 2754.5043, "Agent": "DDPG"}, {"env_step": 585000, "rew": 8294.6894, "rew_std": 2755.9684, "Agent": "DDPG"}, {"env_step": 590000, "rew": 8295.7791, "rew_std": 2755.8167, "Agent": "DDPG"}, {"env_step": 595000, "rew": 8292.8612, "rew_std": 2755.1106, "Agent": "DDPG"}, {"env_step": 600000, "rew": 8291.6771, "rew_std": 2753.8879, "Agent": "DDPG"}, {"env_step": 605000, "rew": 8295.3033, "rew_std": 2755.9122, "Agent": "DDPG"}, {"env_step": 610000, "rew": 8296.0122, "rew_std": 2756.4109, "Agent": "DDPG"}, {"env_step": 615000, "rew": 8295.3513, "rew_std": 2755.9098, "Agent": "DDPG"}, {"env_step": 620000, "rew": 8294.0031, "rew_std": 2754.9571, "Agent": "DDPG"}, {"env_step": 625000, "rew": 8292.0084, "rew_std": 2754.2688, "Agent": "DDPG"}, {"env_step": 630000, "rew": 8293.83, "rew_std": 2755.1403, "Agent": "DDPG"}, {"env_step": 635000, "rew": 8295.4863, "rew_std": 2755.9707, "Agent": "DDPG"}, {"env_step": 640000, "rew": 8293.4934, "rew_std": 2755.3081, "Agent": "DDPG"}, {"env_step": 645000, "rew": 8295.3632, "rew_std": 2755.9298, "Agent": "DDPG"}, {"env_step": 650000, "rew": 8296.3766, "rew_std": 2756.2698, "Agent": "DDPG"}, {"env_step": 655000, "rew": 8291.4066, "rew_std": 2754.0746, "Agent": "DDPG"}, {"env_step": 660000, "rew": 8293.2079, "rew_std": 2754.6713, "Agent": "DDPG"}, {"env_step": 665000, "rew": 8293.3277, "rew_std": 2754.9914, "Agent": "DDPG"}, {"env_step": 670000, "rew": 8292.8327, "rew_std": 2754.8237, "Agent": "DDPG"}, {"env_step": 675000, "rew": 8293.4509, "rew_std": 2755.3201, "Agent": "DDPG"}, {"env_step": 680000, "rew": 8297.0175, "rew_std": 2756.2111, "Agent": "DDPG"}, {"env_step": 685000, "rew": 8294.7786, "rew_std": 2755.2036, "Agent": "DDPG"}, {"env_step": 690000, "rew": 8295.8477, "rew_std": 2756.0947, "Agent": "DDPG"}, {"env_step": 695000, "rew": 8297.5199, "rew_std": 2756.1001, "Agent": "DDPG"}, {"env_step": 700000, "rew": 8294.6571, "rew_std": 2755.1663, "Agent": "DDPG"}, {"env_step": 705000, "rew": 8293.7032, "rew_std": 2755.1142, "Agent": "DDPG"}, {"env_step": 710000, "rew": 8297.6848, "rew_std": 2756.4248, "Agent": "DDPG"}, {"env_step": 715000, "rew": 8296.3341, "rew_std": 2756.2396, "Agent": "DDPG"}, {"env_step": 720000, "rew": 8297.6563, "rew_std": 2756.4191, "Agent": "DDPG"}, {"env_step": 725000, "rew": 8295.9062, "rew_std": 2756.3863, "Agent": "DDPG"}, {"env_step": 730000, "rew": 8295.1217, "rew_std": 2755.5904, "Agent": "DDPG"}, {"env_step": 735000, "rew": 8295.437, "rew_std": 2756.2321, "Agent": "DDPG"}, {"env_step": 740000, "rew": 8297.9849, "rew_std": 2756.8038, "Agent": "DDPG"}, {"env_step": 745000, "rew": 8295.0699, "rew_std": 2756.0934, "Agent": "DDPG"}, {"env_step": 750000, "rew": 8295.2069, "rew_std": 2755.054, "Agent": "DDPG"}, {"env_step": 755000, "rew": 8294.4887, "rew_std": 2755.6316, "Agent": "DDPG"}, {"env_step": 760000, "rew": 8295.5198, "rew_std": 2756.25, "Agent": "DDPG"}, {"env_step": 765000, "rew": 8298.3552, "rew_std": 2756.9195, "Agent": "DDPG"}, {"env_step": 770000, "rew": 8296.7929, "rew_std": 2756.1303, "Agent": "DDPG"}, {"env_step": 775000, "rew": 8299.761, "rew_std": 2756.8651, "Agent": "DDPG"}, {"env_step": 780000, "rew": 8298.0048, "rew_std": 2756.8088, "Agent": "DDPG"}, {"env_step": 785000, "rew": 8296.2551, "rew_std": 2755.9583, "Agent": "DDPG"}, {"env_step": 790000, "rew": 8295.302, "rew_std": 2755.6306, "Agent": "DDPG"}, {"env_step": 795000, "rew": 8292.0512, "rew_std": 2754.5373, "Agent": "DDPG"}, {"env_step": 800000, "rew": 8294.4388, "rew_std": 2755.6203, "Agent": "DDPG"}, {"env_step": 805000, "rew": 8297.1481, "rew_std": 2756.5269, "Agent": "DDPG"}, {"env_step": 810000, "rew": 8292.8083, "rew_std": 2755.3493, "Agent": "DDPG"}, {"env_step": 815000, "rew": 8301.0287, "rew_std": 2757.8421, "Agent": "DDPG"}, {"env_step": 820000, "rew": 8295.6358, "rew_std": 2755.7482, "Agent": "DDPG"}, {"env_step": 825000, "rew": 8291.6853, "rew_std": 2754.6938, "Agent": "DDPG"}, {"env_step": 830000, "rew": 8295.6276, "rew_std": 2755.7279, "Agent": "DDPG"}, {"env_step": 835000, "rew": 8295.8508, "rew_std": 2756.3616, "Agent": "DDPG"}, {"env_step": 840000, "rew": 8296.7933, "rew_std": 2756.6663, "Agent": "DDPG"}, {"env_step": 845000, "rew": 8297.2022, "rew_std": 2756.7935, "Agent": "DDPG"}, {"env_step": 850000, "rew": 8296.1111, "rew_std": 2756.1792, "Agent": "DDPG"}, {"env_step": 855000, "rew": 8296.2931, "rew_std": 2756.5108, "Agent": "DDPG"}, {"env_step": 860000, "rew": 8295.5999, "rew_std": 2756.2757, "Agent": "DDPG"}, {"env_step": 865000, "rew": 8300.1544, "rew_std": 2757.5203, "Agent": "DDPG"}, {"env_step": 870000, "rew": 8296.1314, "rew_std": 2755.9105, "Agent": "DDPG"}, {"env_step": 875000, "rew": 8297.2111, "rew_std": 2756.5472, "Agent": "DDPG"}, {"env_step": 880000, "rew": 8295.3819, "rew_std": 2754.5896, "Agent": "DDPG"}, {"env_step": 885000, "rew": 8296.8615, "rew_std": 2756.429, "Agent": "DDPG"}, {"env_step": 890000, "rew": 8298.6941, "rew_std": 2756.757, "Agent": "DDPG"}, {"env_step": 895000, "rew": 8297.697, "rew_std": 2756.437, "Agent": "DDPG"}, {"env_step": 900000, "rew": 8296.1023, "rew_std": 2755.8934, "Agent": "DDPG"}, {"env_step": 905000, "rew": 8298.3042, "rew_std": 2756.369, "Agent": "DDPG"}, {"env_step": 910000, "rew": 8296.4108, "rew_std": 2756.0118, "Agent": "DDPG"}, {"env_step": 915000, "rew": 8298.7159, "rew_std": 2757.064, "Agent": "DDPG"}, {"env_step": 920000, "rew": 8298.8204, "rew_std": 2757.3504, "Agent": "DDPG"}, {"env_step": 925000, "rew": 8300.3121, "rew_std": 2757.3023, "Agent": "DDPG"}, {"env_step": 930000, "rew": 8296.4645, "rew_std": 2756.0223, "Agent": "DDPG"}, {"env_step": 935000, "rew": 8300.1583, "rew_std": 2757.5244, "Agent": "DDPG"}, {"env_step": 940000, "rew": 8294.9937, "rew_std": 2755.7992, "Agent": "DDPG"}, {"env_step": 945000, "rew": 8297.501, "rew_std": 2756.9001, "Agent": "DDPG"}, {"env_step": 950000, "rew": 8295.0375, "rew_std": 2755.5536, "Agent": "DDPG"}, {"env_step": 955000, "rew": 8295.7071, "rew_std": 2755.5132, "Agent": "DDPG"}, {"env_step": 960000, "rew": 8302.3607, "rew_std": 2758.2533, "Agent": "DDPG"}, {"env_step": 965000, "rew": 8296.644, "rew_std": 2756.3489, "Agent": "DDPG"}, {"env_step": 970000, "rew": 8298.3855, "rew_std": 2756.926, "Agent": "DDPG"}, {"env_step": 975000, "rew": 8297.1022, "rew_std": 2756.7851, "Agent": "DDPG"}, {"env_step": 980000, "rew": 8300.2825, "rew_std": 2757.8324, "Agent": "DDPG"}, {"env_step": 985000, "rew": 8297.9532, "rew_std": 2756.5307, "Agent": "DDPG"}, {"env_step": 990000, "rew": 8296.4771, "rew_std": 2756.0346, "Agent": "DDPG"}, {"env_step": 995000, "rew": 8295.8242, "rew_std": 2756.0726, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 8296.892, "rew_std": 2756.4241, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 8297.6683, "rew_std": 2756.1623, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 8295.0875, "rew_std": 2755.8313, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 8297.3172, "rew_std": 2756.5848, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 8293.767, "rew_std": 2755.3931, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 8293.8516, "rew_std": 2755.699, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 8292.2973, "rew_std": 2754.3564, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 8293.4526, "rew_std": 2755.2837, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 8293.6104, "rew_std": 2755.3343, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 8293.7552, "rew_std": 2754.8439, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 7662.5222, "rew_std": 3164.0049, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 8294.0077, "rew_std": 2754.9234, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 8293.2793, "rew_std": 2755.2315, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 8292.5417, "rew_std": 2755.2513, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 8292.0735, "rew_std": 2754.2833, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 8293.0015, "rew_std": 2754.6026, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 8291.2618, "rew_std": 2754.5517, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 8292.1272, "rew_std": 2754.8365, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 8291.3055, "rew_std": 2754.0306, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 8292.1366, "rew_std": 2754.5853, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 8292.0401, "rew_std": 2755.0818, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 8291.6328, "rew_std": 2754.9401, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 8290.2115, "rew_std": 2753.9331, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 8290.8631, "rew_std": 2754.4196, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 8289.9777, "rew_std": 2753.5913, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 8292.2272, "rew_std": 2754.345, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 8290.1447, "rew_std": 2754.1867, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 8290.2864, "rew_std": 2753.9518, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 8289.5183, "rew_std": 2753.9746, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 8288.7194, "rew_std": 2753.4345, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 8291.2075, "rew_std": 2754.2573, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 8290.7335, "rew_std": 2753.8476, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 8293.1154, "rew_std": 2754.9056, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 8290.8389, "rew_std": 2753.8674, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 8290.7747, "rew_std": 2754.1264, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 8254.041, "rew_std": 2744.3561, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 8292.2006, "rew_std": 2754.6063, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 8290.7599, "rew_std": 2754.396, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 8290.1479, "rew_std": 2753.3733, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 8291.7456, "rew_std": 2754.7311, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 8293.014, "rew_std": 2754.6125, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 8290.6384, "rew_std": 2754.3514, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 8291.264, "rew_std": 2754.8298, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 8289.5644, "rew_std": 2753.9916, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 8292.3213, "rew_std": 2755.2023, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 8292.2093, "rew_std": 2755.1442, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 8292.6926, "rew_std": 2754.7738, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 8289.2696, "rew_std": 2754.1698, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 8293.3196, "rew_std": 2754.9889, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 8291.3114, "rew_std": 2754.3019, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 8294.6964, "rew_std": 2755.7174, "Agent": "DDPG"}, {"env_step": 0, "rew": 53.5626, "rew_std": 5.4712, "Agent": "NPG"}, {"env_step": 30720, "rew": 93.7525, "rew_std": 7.8065, "Agent": "NPG"}, {"env_step": 61440, "rew": 145.1677, "rew_std": 11.1809, "Agent": "NPG"}, {"env_step": 92160, "rew": 227.7882, "rew_std": 47.6936, "Agent": "NPG"}, {"env_step": 122880, "rew": 331.3754, "rew_std": 35.9211, "Agent": "NPG"}, {"env_step": 153600, "rew": 450.2905, "rew_std": 98.6661, "Agent": "NPG"}, {"env_step": 184320, "rew": 1282.0046, "rew_std": 1215.1833, "Agent": "NPG"}, {"env_step": 215040, "rew": 5172.1435, "rew_std": 3336.5647, "Agent": "NPG"}, {"env_step": 245760, "rew": 7556.8745, "rew_std": 2358.8193, "Agent": "NPG"}, {"env_step": 276480, "rew": 8342.2332, "rew_std": 889.5419, "Agent": "NPG"}, {"env_step": 307200, "rew": 9120.4056, "rew_std": 363.6629, "Agent": "NPG"}, {"env_step": 337920, "rew": 8790.0591, "rew_std": 607.4685, "Agent": "NPG"}, {"env_step": 368640, "rew": 7497.9364, "rew_std": 918.9238, "Agent": "NPG"}, {"env_step": 399360, "rew": 9243.2042, "rew_std": 276.0102, "Agent": "NPG"}, {"env_step": 430080, "rew": 8782.4836, "rew_std": 735.3132, "Agent": "NPG"}, {"env_step": 460800, "rew": 8135.8516, "rew_std": 1013.2713, "Agent": "NPG"}, {"env_step": 491520, "rew": 8636.2203, "rew_std": 760.4209, "Agent": "NPG"}, {"env_step": 522240, "rew": 8603.2744, "rew_std": 985.0476, "Agent": "NPG"}, {"env_step": 552960, "rew": 7953.9208, "rew_std": 944.2577, "Agent": "NPG"}, {"env_step": 583680, "rew": 8504.378, "rew_std": 645.6198, "Agent": "NPG"}, {"env_step": 614400, "rew": 6299.3341, "rew_std": 926.591, "Agent": "NPG"}, {"env_step": 645120, "rew": 7321.6252, "rew_std": 1220.76, "Agent": "NPG"}, {"env_step": 675840, "rew": 6588.6516, "rew_std": 1533.5691, "Agent": "NPG"}, {"env_step": 706560, "rew": 7603.2033, "rew_std": 1128.6156, "Agent": "NPG"}, {"env_step": 737280, "rew": 7697.9528, "rew_std": 1066.3563, "Agent": "NPG"}, {"env_step": 768000, "rew": 7868.5664, "rew_std": 1021.7702, "Agent": "NPG"}, {"env_step": 798720, "rew": 8326.5491, "rew_std": 756.4409, "Agent": "NPG"}, {"env_step": 829440, "rew": 6494.5301, "rew_std": 955.295, "Agent": "NPG"}, {"env_step": 860160, "rew": 7501.9611, "rew_std": 1487.8421, "Agent": "NPG"}, {"env_step": 890880, "rew": 8239.8652, "rew_std": 989.5976, "Agent": "NPG"}, {"env_step": 921600, "rew": 7509.1838, "rew_std": 1479.877, "Agent": "NPG"}, {"env_step": 952320, "rew": 8846.8643, "rew_std": 599.2212, "Agent": "NPG"}, {"env_step": 983040, "rew": 8341.8588, "rew_std": 837.6174, "Agent": "NPG"}, {"env_step": 1013760, "rew": 8332.1646, "rew_std": 863.0581, "Agent": "NPG"}, {"env_step": 1044480, "rew": 7782.1788, "rew_std": 1086.4028, "Agent": "NPG"}, {"env_step": 1075200, "rew": 7635.1259, "rew_std": 637.9461, "Agent": "NPG"}, {"env_step": 1105920, "rew": 5717.9593, "rew_std": 1559.7387, "Agent": "NPG"}, {"env_step": 1136640, "rew": 6803.4293, "rew_std": 493.9787, "Agent": "NPG"}, {"env_step": 1167360, "rew": 8693.1565, "rew_std": 831.7087, "Agent": "NPG"}, {"env_step": 1198080, "rew": 8676.553, "rew_std": 564.7209, "Agent": "NPG"}, {"env_step": 1228800, "rew": 7882.9752, "rew_std": 1153.8992, "Agent": "NPG"}, {"env_step": 1259520, "rew": 7416.5771, "rew_std": 642.9856, "Agent": "NPG"}, {"env_step": 1290240, "rew": 7224.5211, "rew_std": 921.5855, "Agent": "NPG"}, {"env_step": 1320960, "rew": 7541.964, "rew_std": 942.8465, "Agent": "NPG"}, {"env_step": 1351680, "rew": 6955.1912, "rew_std": 729.6559, "Agent": "NPG"}, {"env_step": 1382400, "rew": 7857.8242, "rew_std": 1226.5542, "Agent": "NPG"}, {"env_step": 1413120, "rew": 8975.9127, "rew_std": 607.2945, "Agent": "NPG"}, {"env_step": 1443840, "rew": 8227.1127, "rew_std": 861.5084, "Agent": "NPG"}, {"env_step": 1474560, "rew": 7596.6879, "rew_std": 962.8973, "Agent": "NPG"}, {"env_step": 1505280, "rew": 6582.4302, "rew_std": 1887.2931, "Agent": "NPG"}, {"env_step": 1536000, "rew": 7217.4144, "rew_std": 1075.038, "Agent": "NPG"}, {"env_step": 1566720, "rew": 8788.3364, "rew_std": 606.8396, "Agent": "NPG"}, {"env_step": 1597440, "rew": 6406.4683, "rew_std": 1530.4712, "Agent": "NPG"}, {"env_step": 1628160, "rew": 6222.7329, "rew_std": 1557.3993, "Agent": "NPG"}, {"env_step": 1658880, "rew": 5671.6322, "rew_std": 1602.9869, "Agent": "NPG"}, {"env_step": 1689600, "rew": 6458.5924, "rew_std": 955.4097, "Agent": "NPG"}, {"env_step": 1720320, "rew": 8255.7237, "rew_std": 882.877, "Agent": "NPG"}, {"env_step": 1751040, "rew": 7236.3726, "rew_std": 904.844, "Agent": "NPG"}, {"env_step": 1781760, "rew": 6624.1905, "rew_std": 1290.8312, "Agent": "NPG"}, {"env_step": 1812480, "rew": 5374.0434, "rew_std": 855.3992, "Agent": "NPG"}, {"env_step": 1843200, "rew": 7887.3667, "rew_std": 1817.1808, "Agent": "NPG"}, {"env_step": 1873920, "rew": 7597.0396, "rew_std": 1028.537, "Agent": "NPG"}, {"env_step": 1904640, "rew": 6702.5288, "rew_std": 653.2027, "Agent": "NPG"}, {"env_step": 1935360, "rew": 6169.228, "rew_std": 1494.6354, "Agent": "NPG"}, {"env_step": 1966080, "rew": 7421.8628, "rew_std": 1715.79, "Agent": "NPG"}, {"env_step": 1996800, "rew": 5688.8848, "rew_std": 1616.7137, "Agent": "NPG"}, {"env_step": 2027520, "rew": 6750.3647, "rew_std": 1617.0297, "Agent": "NPG"}, {"env_step": 2058240, "rew": 7070.6516, "rew_std": 1251.6352, "Agent": "NPG"}, {"env_step": 2088960, "rew": 7195.2004, "rew_std": 861.5709, "Agent": "NPG"}, {"env_step": 2119680, "rew": 5420.7439, "rew_std": 1527.7407, "Agent": "NPG"}, {"env_step": 2150400, "rew": 7257.8297, "rew_std": 1374.2466, "Agent": "NPG"}, {"env_step": 2181120, "rew": 4872.7478, "rew_std": 1468.0044, "Agent": "NPG"}, {"env_step": 2211840, "rew": 7188.6986, "rew_std": 1218.7812, "Agent": "NPG"}, {"env_step": 2242560, "rew": 5842.3451, "rew_std": 1293.316, "Agent": "NPG"}, {"env_step": 2273280, "rew": 6426.7194, "rew_std": 1506.8555, "Agent": "NPG"}, {"env_step": 2304000, "rew": 7884.1542, "rew_std": 734.7095, "Agent": "NPG"}, {"env_step": 2334720, "rew": 5753.8633, "rew_std": 1051.8227, "Agent": "NPG"}, {"env_step": 2365440, "rew": 6034.9842, "rew_std": 1791.209, "Agent": "NPG"}, {"env_step": 2396160, "rew": 6307.4989, "rew_std": 1089.9991, "Agent": "NPG"}, {"env_step": 2426880, "rew": 5764.5426, "rew_std": 1396.7399, "Agent": "NPG"}, {"env_step": 2457600, "rew": 7054.1218, "rew_std": 1314.0487, "Agent": "NPG"}, {"env_step": 2488320, "rew": 7060.1352, "rew_std": 1752.3972, "Agent": "NPG"}, {"env_step": 2519040, "rew": 5125.029, "rew_std": 1577.2035, "Agent": "NPG"}, {"env_step": 2549760, "rew": 7058.9974, "rew_std": 1100.9997, "Agent": "NPG"}, {"env_step": 2580480, "rew": 7805.5938, "rew_std": 1361.2888, "Agent": "NPG"}, {"env_step": 2611200, "rew": 8162.1976, "rew_std": 1013.4727, "Agent": "NPG"}, {"env_step": 2641920, "rew": 7170.2241, "rew_std": 1300.1413, "Agent": "NPG"}, {"env_step": 2672640, "rew": 7328.2797, "rew_std": 1279.522, "Agent": "NPG"}, {"env_step": 2703360, "rew": 6235.7244, "rew_std": 1850.8459, "Agent": "NPG"}, {"env_step": 2734080, "rew": 6338.7643, "rew_std": 1516.0854, "Agent": "NPG"}, {"env_step": 2764800, "rew": 5596.0665, "rew_std": 1707.551, "Agent": "NPG"}, {"env_step": 2795520, "rew": 6112.4961, "rew_std": 1511.4371, "Agent": "NPG"}, {"env_step": 2826240, "rew": 6789.8476, "rew_std": 2006.1376, "Agent": "NPG"}, {"env_step": 2856960, "rew": 5580.7281, "rew_std": 1824.1451, "Agent": "NPG"}, {"env_step": 2887680, "rew": 5939.7712, "rew_std": 1640.1104, "Agent": "NPG"}, {"env_step": 2918400, "rew": 5724.2187, "rew_std": 1511.346, "Agent": "NPG"}, {"env_step": 2949120, "rew": 5876.7021, "rew_std": 1668.2841, "Agent": "NPG"}, {"env_step": 2979840, "rew": 5605.5739, "rew_std": 1106.9738, "Agent": "NPG"}, {"env_step": 3010560, "rew": 7114.6138, "rew_std": 1004.4565, "Agent": "NPG"}, {"env_step": 3041280, "rew": 6610.3985, "rew_std": 1094.8828, "Agent": "NPG"}, {"env_step": 3072000, "rew": 5673.5061, "rew_std": 1901.9522, "Agent": "NPG"}]