[{"env_step": 0, "rew": -274.9585, "rew_std": 30.3947, "Agent": "PPO"}, {"env_step": 30720, "rew": 11.9799, "rew_std": 55.2327, "Agent": "PPO"}, {"env_step": 61440, "rew": 345.7298, "rew_std": 139.9961, "Agent": "PPO"}, {"env_step": 92160, "rew": 909.6493, "rew_std": 303.9931, "Agent": "PPO"}, {"env_step": 122880, "rew": 1370.7231, "rew_std": 466.5559, "Agent": "PPO"}, {"env_step": 153600, "rew": 1978.4231, "rew_std": 768.0638, "Agent": "PPO"}, {"env_step": 184320, "rew": 2466.3956, "rew_std": 727.2613, "Agent": "PPO"}, {"env_step": 215040, "rew": 2932.2232, "rew_std": 768.6621, "Agent": "PPO"}, {"env_step": 245760, "rew": 3256.0578, "rew_std": 791.5371, "Agent": "PPO"}, {"env_step": 276480, "rew": 3608.5002, "rew_std": 913.1391, "Agent": "PPO"}, {"env_step": 307200, "rew": 3927.2865, "rew_std": 996.2931, "Agent": "PPO"}, {"env_step": 337920, "rew": 4036.1874, "rew_std": 889.6304, "Agent": "PPO"}, {"env_step": 368640, "rew": 4211.7008, "rew_std": 967.32, "Agent": "PPO"}, {"env_step": 399360, "rew": 4469.8477, "rew_std": 1067.6662, "Agent": "PPO"}, {"env_step": 430080, "rew": 4508.921, "rew_std": 952.455, "Agent": "PPO"}, {"env_step": 460800, "rew": 4718.2123, "rew_std": 1095.8106, "Agent": "PPO"}, {"env_step": 491520, "rew": 4877.9208, "rew_std": 1055.6683, "Agent": "PPO"}, {"env_step": 522240, "rew": 4896.2957, "rew_std": 980.5305, "Agent": "PPO"}, {"env_step": 552960, "rew": 5173.8165, "rew_std": 1106.9123, "Agent": "PPO"}, {"env_step": 583680, "rew": 5164.5684, "rew_std": 1146.3997, "Agent": "PPO"}, {"env_step": 614400, "rew": 5291.8974, "rew_std": 1195.9413, "Agent": "PPO"}, {"env_step": 645120, "rew": 5258.5054, "rew_std": 1149.9965, "Agent": "PPO"}, {"env_step": 675840, "rew": 5389.2988, "rew_std": 1304.1797, "Agent": "PPO"}, {"env_step": 706560, "rew": 5290.879, "rew_std": 1152.4471, "Agent": "PPO"}, {"env_step": 737280, "rew": 5483.6851, "rew_std": 1062.3022, "Agent": "PPO"}, {"env_step": 768000, "rew": 5235.702, "rew_std": 1092.4269, "Agent": "PPO"}, {"env_step": 798720, "rew": 5380.5798, "rew_std": 1149.1554, "Agent": "PPO"}, {"env_step": 829440, "rew": 5609.442, "rew_std": 1139.8926, "Agent": "PPO"}, {"env_step": 860160, "rew": 5535.6169, "rew_std": 1188.8048, "Agent": "PPO"}, {"env_step": 890880, "rew": 5733.831, "rew_std": 1221.6438, "Agent": "PPO"}, {"env_step": 921600, "rew": 5783.8931, "rew_std": 1243.9648, "Agent": "PPO"}, {"env_step": 952320, "rew": 5636.1712, "rew_std": 1398.1925, "Agent": "PPO"}, {"env_step": 983040, "rew": 5780.2176, "rew_std": 1267.7102, "Agent": "PPO"}, {"env_step": 1013760, "rew": 5649.9171, "rew_std": 1226.3424, "Agent": "PPO"}, {"env_step": 1044480, "rew": 5929.9898, "rew_std": 1158.9523, "Agent": "PPO"}, {"env_step": 1075200, "rew": 5961.6938, "rew_std": 1207.4791, "Agent": "PPO"}, {"env_step": 1105920, "rew": 6070.5436, "rew_std": 1286.7158, "Agent": "PPO"}, {"env_step": 1136640, "rew": 6087.6435, "rew_std": 1203.064, "Agent": "PPO"}, {"env_step": 1167360, "rew": 6084.3965, "rew_std": 1086.3397, "Agent": "PPO"}, {"env_step": 1198080, "rew": 6138.0199, "rew_std": 1164.6205, "Agent": "PPO"}, {"env_step": 1228800, "rew": 6103.6806, "rew_std": 1104.3936, "Agent": "PPO"}, {"env_step": 1259520, "rew": 6272.6565, "rew_std": 1283.0591, "Agent": "PPO"}, {"env_step": 1290240, "rew": 5979.2705, "rew_std": 1387.8467, "Agent": "PPO"}, {"env_step": 1320960, "rew": 6270.4063, "rew_std": 1344.6734, "Agent": "PPO"}, {"env_step": 1351680, "rew": 6311.9153, "rew_std": 1318.2905, "Agent": "PPO"}, {"env_step": 1382400, "rew": 6457.731, "rew_std": 1296.4794, "Agent": "PPO"}, {"env_step": 1413120, "rew": 6391.7267, "rew_std": 1265.2202, "Agent": "PPO"}, {"env_step": 1443840, "rew": 6494.0974, "rew_std": 1286.5803, "Agent": "PPO"}, {"env_step": 1474560, "rew": 6443.9407, "rew_std": 1231.9738, "Agent": "PPO"}, {"env_step": 1505280, "rew": 6489.5079, "rew_std": 1387.1682, "Agent": "PPO"}, {"env_step": 1536000, "rew": 6424.721, "rew_std": 1264.9294, "Agent": "PPO"}, {"env_step": 1566720, "rew": 6514.5716, "rew_std": 1267.179, "Agent": "PPO"}, {"env_step": 1597440, "rew": 6442.9185, "rew_std": 1254.8738, "Agent": "PPO"}, {"env_step": 1628160, "rew": 6519.5557, "rew_std": 1200.6957, "Agent": "PPO"}, {"env_step": 1658880, "rew": 6612.5312, "rew_std": 1318.4577, "Agent": "PPO"}, {"env_step": 1689600, "rew": 6621.729, "rew_std": 1408.4337, "Agent": "PPO"}, {"env_step": 1720320, "rew": 6733.1272, "rew_std": 1352.7413, "Agent": "PPO"}, {"env_step": 1751040, "rew": 6598.918, "rew_std": 1249.3865, "Agent": "PPO"}, {"env_step": 1781760, "rew": 6690.3299, "rew_std": 1359.7003, "Agent": "PPO"}, {"env_step": 1812480, "rew": 6603.2403, "rew_std": 1293.2844, "Agent": "PPO"}, {"env_step": 1843200, "rew": 6756.5714, "rew_std": 1222.5844, "Agent": "PPO"}, {"env_step": 1873920, "rew": 6652.8604, "rew_std": 1413.5678, "Agent": "PPO"}, {"env_step": 1904640, "rew": 6703.5758, "rew_std": 1361.8639, "Agent": "PPO"}, {"env_step": 1935360, "rew": 6796.892, "rew_std": 1308.253, "Agent": "PPO"}, {"env_step": 1966080, "rew": 6618.2339, "rew_std": 1212.2791, "Agent": "PPO"}, {"env_step": 1996800, "rew": 6760.9166, "rew_std": 1445.6126, "Agent": "PPO"}, {"env_step": 2027520, "rew": 6657.0263, "rew_std": 1416.5504, "Agent": "PPO"}, {"env_step": 2058240, "rew": 6797.0142, "rew_std": 1369.9286, "Agent": "PPO"}, {"env_step": 2088960, "rew": 6941.3041, "rew_std": 1424.6141, "Agent": "PPO"}, {"env_step": 2119680, "rew": 6679.1551, "rew_std": 1502.0568, "Agent": "PPO"}, {"env_step": 2150400, "rew": 6877.6658, "rew_std": 1419.0989, "Agent": "PPO"}, {"env_step": 2181120, "rew": 6893.2083, "rew_std": 1362.4631, "Agent": "PPO"}, {"env_step": 2211840, "rew": 6884.2739, "rew_std": 1537.1663, "Agent": "PPO"}, {"env_step": 2242560, "rew": 6544.0137, "rew_std": 1765.0257, "Agent": "PPO"}, {"env_step": 2273280, "rew": 6873.6828, "rew_std": 1544.1919, "Agent": "PPO"}, {"env_step": 2304000, "rew": 6930.433, "rew_std": 1425.9817, "Agent": "PPO"}, {"env_step": 2334720, "rew": 6970.6427, "rew_std": 1612.793, "Agent": "PPO"}, {"env_step": 2365440, "rew": 6976.7841, "rew_std": 1502.4346, "Agent": "PPO"}, {"env_step": 2396160, "rew": 6956.7531, "rew_std": 1521.8277, "Agent": "PPO"}, {"env_step": 2426880, "rew": 6923.9605, "rew_std": 1502.0078, "Agent": "PPO"}, {"env_step": 2457600, "rew": 7076.802, "rew_std": 1461.5333, "Agent": "PPO"}, {"env_step": 2488320, "rew": 6910.2399, "rew_std": 1554.5215, "Agent": "PPO"}, {"env_step": 2519040, "rew": 7015.2602, "rew_std": 1620.3088, "Agent": "PPO"}, {"env_step": 2549760, "rew": 7044.4279, "rew_std": 1445.5683, "Agent": "PPO"}, {"env_step": 2580480, "rew": 7149.1791, "rew_std": 1366.216, "Agent": "PPO"}, {"env_step": 2611200, "rew": 7272.657, "rew_std": 1544.8839, "Agent": "PPO"}, {"env_step": 2641920, "rew": 7315.5085, "rew_std": 1382.7119, "Agent": "PPO"}, {"env_step": 2672640, "rew": 7118.8575, "rew_std": 1598.8056, "Agent": "PPO"}, {"env_step": 2703360, "rew": 7207.8444, "rew_std": 1569.6635, "Agent": "PPO"}, {"env_step": 2734080, "rew": 7174.3004, "rew_std": 1515.153, "Agent": "PPO"}, {"env_step": 2764800, "rew": 7262.0208, "rew_std": 1514.371, "Agent": "PPO"}, {"env_step": 2795520, "rew": 7172.3527, "rew_std": 1623.1998, "Agent": "PPO"}, {"env_step": 2826240, "rew": 7233.2708, "rew_std": 1585.3007, "Agent": "PPO"}, {"env_step": 2856960, "rew": 7217.521, "rew_std": 1510.6647, "Agent": "PPO"}, {"env_step": 2887680, "rew": 7293.4964, "rew_std": 1417.3943, "Agent": "PPO"}, {"env_step": 2918400, "rew": 7337.4447, "rew_std": 1508.2475, "Agent": "PPO"}, {"env_step": 2949120, "rew": 7153.7914, "rew_std": 1587.5787, "Agent": "PPO"}, {"env_step": 2979840, "rew": 7241.567, "rew_std": 1467.1855, "Agent": "PPO"}, {"env_step": 3010560, "rew": 7274.2529, "rew_std": 1480.4173, "Agent": "PPO"}, {"env_step": 3041280, "rew": 7236.2394, "rew_std": 1590.6492, "Agent": "PPO"}, {"env_step": 3072000, "rew": 7194.2608, "rew_std": 1404.8626, "Agent": "PPO"}, {"env_step": 5000, "rew": -491.7738, "rew_std": 108.7776, "Agent": "TD3"}, {"env_step": 10000, "rew": -262.0194, "rew_std": 291.8401, "Agent": "TD3"}, {"env_step": 15000, "rew": 939.3631, "rew_std": 527.7309, "Agent": "TD3"}, {"env_step": 20000, "rew": 1252.1263, "rew_std": 495.519, "Agent": "TD3"}, {"env_step": 25000, "rew": 2023.157, "rew_std": 523.8599, "Agent": "TD3"}, {"env_step": 30000, "rew": 2470.4407, "rew_std": 572.3322, "Agent": "TD3"}, {"env_step": 35000, "rew": 2749.4355, "rew_std": 598.9823, "Agent": "TD3"}, {"env_step": 40000, "rew": 3033.9985, "rew_std": 779.7287, "Agent": "TD3"}, {"env_step": 45000, "rew": 3414.1016, "rew_std": 557.1514, "Agent": "TD3"}, {"env_step": 50000, "rew": 3891.1476, "rew_std": 538.9045, "Agent": "TD3"}, {"env_step": 55000, "rew": 3769.953, "rew_std": 880.9102, "Agent": "TD3"}, {"env_step": 60000, "rew": 4215.0849, "rew_std": 338.3772, "Agent": "TD3"}, {"env_step": 65000, "rew": 4181.9487, "rew_std": 574.3375, "Agent": "TD3"}, {"env_step": 70000, "rew": 4451.898, "rew_std": 650.4167, "Agent": "TD3"}, {"env_step": 75000, "rew": 4715.3097, "rew_std": 387.332, "Agent": "TD3"}, {"env_step": 80000, "rew": 4977.8756, "rew_std": 332.4097, "Agent": "TD3"}, {"env_step": 85000, "rew": 4896.933, "rew_std": 436.9965, "Agent": "TD3"}, {"env_step": 90000, "rew": 5098.2884, "rew_std": 380.5583, "Agent": "TD3"}, {"env_step": 95000, "rew": 5064.4533, "rew_std": 376.0554, "Agent": "TD3"}, {"env_step": 100000, "rew": 5335.7776, "rew_std": 376.493, "Agent": "TD3"}, {"env_step": 105000, "rew": 5467.5474, "rew_std": 373.8211, "Agent": "TD3"}, {"env_step": 110000, "rew": 5548.1319, "rew_std": 376.2427, "Agent": "TD3"}, {"env_step": 115000, "rew": 5569.3028, "rew_std": 518.1977, "Agent": "TD3"}, {"env_step": 120000, "rew": 5557.8942, "rew_std": 501.4938, "Agent": "TD3"}, {"env_step": 125000, "rew": 5722.358, "rew_std": 351.7448, "Agent": "TD3"}, {"env_step": 130000, "rew": 5758.6115, "rew_std": 424.7812, "Agent": "TD3"}, {"env_step": 135000, "rew": 5848.0071, "rew_std": 496.162, "Agent": "TD3"}, {"env_step": 140000, "rew": 6062.7877, "rew_std": 456.7988, "Agent": "TD3"}, {"env_step": 145000, "rew": 5828.3979, "rew_std": 584.2805, "Agent": "TD3"}, {"env_step": 150000, "rew": 6110.8245, "rew_std": 399.7731, "Agent": "TD3"}, {"env_step": 155000, "rew": 6157.971, "rew_std": 451.4417, "Agent": "TD3"}, {"env_step": 160000, "rew": 6260.956, "rew_std": 455.5466, "Agent": "TD3"}, {"env_step": 165000, "rew": 6117.1841, "rew_std": 576.6519, "Agent": "TD3"}, {"env_step": 170000, "rew": 6360.7148, "rew_std": 465.9206, "Agent": "TD3"}, {"env_step": 175000, "rew": 6488.1046, "rew_std": 564.2199, "Agent": "TD3"}, {"env_step": 180000, "rew": 6485.5139, "rew_std": 523.2218, "Agent": "TD3"}, {"env_step": 185000, "rew": 6511.1075, "rew_std": 624.1234, "Agent": "TD3"}, {"env_step": 190000, "rew": 6623.9033, "rew_std": 606.1132, "Agent": "TD3"}, {"env_step": 195000, "rew": 6753.3993, "rew_std": 578.0539, "Agent": "TD3"}, {"env_step": 200000, "rew": 6720.6971, "rew_std": 617.1835, "Agent": "TD3"}, {"env_step": 205000, "rew": 6882.3305, "rew_std": 679.724, "Agent": "TD3"}, {"env_step": 210000, "rew": 6880.4545, "rew_std": 707.2802, "Agent": "TD3"}, {"env_step": 215000, "rew": 6899.3154, "rew_std": 623.297, "Agent": "TD3"}, {"env_step": 220000, "rew": 6959.4102, "rew_std": 532.1334, "Agent": "TD3"}, {"env_step": 225000, "rew": 6920.9057, "rew_std": 511.4183, "Agent": "TD3"}, {"env_step": 230000, "rew": 7056.547, "rew_std": 597.4038, "Agent": "TD3"}, {"env_step": 235000, "rew": 7163.5816, "rew_std": 656.1597, "Agent": "TD3"}, {"env_step": 240000, "rew": 7138.8121, "rew_std": 625.1124, "Agent": "TD3"}, {"env_step": 245000, "rew": 7201.8415, "rew_std": 736.7508, "Agent": "TD3"}, {"env_step": 250000, "rew": 7254.6046, "rew_std": 704.2153, "Agent": "TD3"}, {"env_step": 255000, "rew": 7104.3644, "rew_std": 774.2303, "Agent": "TD3"}, {"env_step": 260000, "rew": 7358.2901, "rew_std": 657.0822, "Agent": "TD3"}, {"env_step": 265000, "rew": 7387.0317, "rew_std": 690.7049, "Agent": "TD3"}, {"env_step": 270000, "rew": 7399.2832, "rew_std": 627.2569, "Agent": "TD3"}, {"env_step": 275000, "rew": 7461.1843, "rew_std": 752.2841, "Agent": "TD3"}, {"env_step": 280000, "rew": 7507.7466, "rew_std": 668.2431, "Agent": "TD3"}, {"env_step": 285000, "rew": 7564.6746, "rew_std": 704.8122, "Agent": "TD3"}, {"env_step": 290000, "rew": 7651.8881, "rew_std": 744.0028, "Agent": "TD3"}, {"env_step": 295000, "rew": 7639.7461, "rew_std": 683.6467, "Agent": "TD3"}, {"env_step": 300000, "rew": 7545.8266, "rew_std": 716.7928, "Agent": "TD3"}, {"env_step": 305000, "rew": 7586.793, "rew_std": 633.4799, "Agent": "TD3"}, {"env_step": 310000, "rew": 7830.0758, "rew_std": 786.95, "Agent": "TD3"}, {"env_step": 315000, "rew": 7753.983, "rew_std": 751.0059, "Agent": "TD3"}, {"env_step": 320000, "rew": 7838.6571, "rew_std": 738.9047, "Agent": "TD3"}, {"env_step": 325000, "rew": 7792.9696, "rew_std": 740.962, "Agent": "TD3"}, {"env_step": 330000, "rew": 7909.5051, "rew_std": 752.5249, "Agent": "TD3"}, {"env_step": 335000, "rew": 7940.4501, "rew_std": 803.4945, "Agent": "TD3"}, {"env_step": 340000, "rew": 7962.7489, "rew_std": 717.4368, "Agent": "TD3"}, {"env_step": 345000, "rew": 8013.5734, "rew_std": 914.0881, "Agent": "TD3"}, {"env_step": 350000, "rew": 8012.9812, "rew_std": 746.8912, "Agent": "TD3"}, {"env_step": 355000, "rew": 8070.066, "rew_std": 728.7675, "Agent": "TD3"}, {"env_step": 360000, "rew": 8029.628, "rew_std": 815.7537, "Agent": "TD3"}, {"env_step": 365000, "rew": 8189.133, "rew_std": 768.2708, "Agent": "TD3"}, {"env_step": 370000, "rew": 8138.5234, "rew_std": 870.01, "Agent": "TD3"}, {"env_step": 375000, "rew": 8199.8861, "rew_std": 749.7979, "Agent": "TD3"}, {"env_step": 380000, "rew": 8178.8484, "rew_std": 704.411, "Agent": "TD3"}, {"env_step": 385000, "rew": 8218.0795, "rew_std": 760.3696, "Agent": "TD3"}, {"env_step": 390000, "rew": 8320.7244, "rew_std": 742.0684, "Agent": "TD3"}, {"env_step": 395000, "rew": 8306.1744, "rew_std": 774.4848, "Agent": "TD3"}, {"env_step": 400000, "rew": 8332.8264, "rew_std": 662.934, "Agent": "TD3"}, {"env_step": 405000, "rew": 8454.6759, "rew_std": 784.0574, "Agent": "TD3"}, {"env_step": 410000, "rew": 8435.5763, "rew_std": 857.1755, "Agent": "TD3"}, {"env_step": 415000, "rew": 8429.4245, "rew_std": 696.4486, "Agent": "TD3"}, {"env_step": 420000, "rew": 8507.612, "rew_std": 759.0253, "Agent": "TD3"}, {"env_step": 425000, "rew": 8407.1033, "rew_std": 731.4275, "Agent": "TD3"}, {"env_step": 430000, "rew": 8494.8885, "rew_std": 743.2674, "Agent": "TD3"}, {"env_step": 435000, "rew": 8612.279, "rew_std": 793.3193, "Agent": "TD3"}, {"env_step": 440000, "rew": 8607.9371, "rew_std": 747.9842, "Agent": "TD3"}, {"env_step": 445000, "rew": 8591.4923, "rew_std": 747.7889, "Agent": "TD3"}, {"env_step": 450000, "rew": 8595.9424, "rew_std": 824.3331, "Agent": "TD3"}, {"env_step": 455000, "rew": 8677.8482, "rew_std": 772.3754, "Agent": "TD3"}, {"env_step": 460000, "rew": 8598.7622, "rew_std": 820.0984, "Agent": "TD3"}, {"env_step": 465000, "rew": 8559.2102, "rew_std": 880.4971, "Agent": "TD3"}, {"env_step": 470000, "rew": 8745.6001, "rew_std": 739.5832, "Agent": "TD3"}, {"env_step": 475000, "rew": 8737.3063, "rew_std": 747.7016, "Agent": "TD3"}, {"env_step": 480000, "rew": 8790.2033, "rew_std": 752.6937, "Agent": "TD3"}, {"env_step": 485000, "rew": 8760.4856, "rew_std": 774.4096, "Agent": "TD3"}, {"env_step": 490000, "rew": 8824.4661, "rew_std": 818.5167, "Agent": "TD3"}, {"env_step": 495000, "rew": 8831.1715, "rew_std": 787.5662, "Agent": "TD3"}, {"env_step": 500000, "rew": 8804.9793, "rew_std": 731.6913, "Agent": "TD3"}, {"env_step": 505000, "rew": 8850.2683, "rew_std": 735.7623, "Agent": "TD3"}, {"env_step": 510000, "rew": 8760.5785, "rew_std": 871.1392, "Agent": "TD3"}, {"env_step": 515000, "rew": 8909.451, "rew_std": 750.5147, "Agent": "TD3"}, {"env_step": 520000, "rew": 8898.6247, "rew_std": 823.3533, "Agent": "TD3"}, {"env_step": 525000, "rew": 8979.796, "rew_std": 803.2727, "Agent": "TD3"}, {"env_step": 530000, "rew": 8826.3866, "rew_std": 688.6222, "Agent": "TD3"}, {"env_step": 535000, "rew": 8943.3122, "rew_std": 862.1328, "Agent": "TD3"}, {"env_step": 540000, "rew": 8950.6791, "rew_std": 841.9943, "Agent": "TD3"}, {"env_step": 545000, "rew": 9076.3193, "rew_std": 807.2128, "Agent": "TD3"}, {"env_step": 550000, "rew": 9083.1078, "rew_std": 783.0794, "Agent": "TD3"}, {"env_step": 555000, "rew": 9100.463, "rew_std": 788.4377, "Agent": "TD3"}, {"env_step": 560000, "rew": 9109.1642, "rew_std": 766.6449, "Agent": "TD3"}, {"env_step": 565000, "rew": 9035.3107, "rew_std": 832.0449, "Agent": "TD3"}, {"env_step": 570000, "rew": 9088.8057, "rew_std": 692.5742, "Agent": "TD3"}, {"env_step": 575000, "rew": 9071.9369, "rew_std": 754.8484, "Agent": "TD3"}, {"env_step": 580000, "rew": 9110.8467, "rew_std": 743.0409, "Agent": "TD3"}, {"env_step": 585000, "rew": 9193.2445, "rew_std": 875.4127, "Agent": "TD3"}, {"env_step": 590000, "rew": 9195.2836, "rew_std": 813.2878, "Agent": "TD3"}, {"env_step": 595000, "rew": 9187.9049, "rew_std": 740.0919, "Agent": "TD3"}, {"env_step": 600000, "rew": 9327.7404, "rew_std": 806.1976, "Agent": "TD3"}, {"env_step": 605000, "rew": 9138.3398, "rew_std": 725.0365, "Agent": "TD3"}, {"env_step": 610000, "rew": 9264.9501, "rew_std": 799.4507, "Agent": "TD3"}, {"env_step": 615000, "rew": 9312.8531, "rew_std": 837.1041, "Agent": "TD3"}, {"env_step": 620000, "rew": 9283.921, "rew_std": 826.1715, "Agent": "TD3"}, {"env_step": 625000, "rew": 9361.8274, "rew_std": 825.3747, "Agent": "TD3"}, {"env_step": 630000, "rew": 9282.1575, "rew_std": 730.256, "Agent": "TD3"}, {"env_step": 635000, "rew": 9377.9864, "rew_std": 793.3509, "Agent": "TD3"}, {"env_step": 640000, "rew": 9284.64, "rew_std": 737.4991, "Agent": "TD3"}, {"env_step": 645000, "rew": 9341.4001, "rew_std": 796.181, "Agent": "TD3"}, {"env_step": 650000, "rew": 9393.1446, "rew_std": 719.3792, "Agent": "TD3"}, {"env_step": 655000, "rew": 9431.7345, "rew_std": 797.8404, "Agent": "TD3"}, {"env_step": 660000, "rew": 9517.6054, "rew_std": 840.7985, "Agent": "TD3"}, {"env_step": 665000, "rew": 9404.8517, "rew_std": 747.3251, "Agent": "TD3"}, {"env_step": 670000, "rew": 9454.8159, "rew_std": 760.1696, "Agent": "TD3"}, {"env_step": 675000, "rew": 9500.148, "rew_std": 787.3883, "Agent": "TD3"}, {"env_step": 680000, "rew": 9561.3347, "rew_std": 785.2622, "Agent": "TD3"}, {"env_step": 685000, "rew": 9487.3321, "rew_std": 818.1828, "Agent": "TD3"}, {"env_step": 690000, "rew": 9426.4945, "rew_std": 792.3134, "Agent": "TD3"}, {"env_step": 695000, "rew": 9489.5022, "rew_std": 765.5105, "Agent": "TD3"}, {"env_step": 700000, "rew": 9341.9792, "rew_std": 846.4012, "Agent": "TD3"}, {"env_step": 705000, "rew": 9454.9199, "rew_std": 764.8516, "Agent": "TD3"}, {"env_step": 710000, "rew": 9589.4149, "rew_std": 772.9486, "Agent": "TD3"}, {"env_step": 715000, "rew": 9645.4927, "rew_std": 780.9173, "Agent": "TD3"}, {"env_step": 720000, "rew": 9668.0014, "rew_std": 785.7856, "Agent": "TD3"}, {"env_step": 725000, "rew": 9625.1669, "rew_std": 737.8234, "Agent": "TD3"}, {"env_step": 730000, "rew": 9502.0475, "rew_std": 968.5391, "Agent": "TD3"}, {"env_step": 735000, "rew": 9483.871, "rew_std": 690.854, "Agent": "TD3"}, {"env_step": 740000, "rew": 9641.7172, "rew_std": 793.3571, "Agent": "TD3"}, {"env_step": 745000, "rew": 9734.494, "rew_std": 812.6246, "Agent": "TD3"}, {"env_step": 750000, "rew": 9720.93, "rew_std": 783.6363, "Agent": "TD3"}, {"env_step": 755000, "rew": 9665.8567, "rew_std": 815.7909, "Agent": "TD3"}, {"env_step": 760000, "rew": 9679.3486, "rew_std": 800.5279, "Agent": "TD3"}, {"env_step": 765000, "rew": 9763.7048, "rew_std": 834.6644, "Agent": "TD3"}, {"env_step": 770000, "rew": 9772.4914, "rew_std": 832.7718, "Agent": "TD3"}, {"env_step": 775000, "rew": 9804.0023, "rew_std": 792.9635, "Agent": "TD3"}, {"env_step": 780000, "rew": 9745.1979, "rew_std": 920.7406, "Agent": "TD3"}, {"env_step": 785000, "rew": 9750.7988, "rew_std": 784.167, "Agent": "TD3"}, {"env_step": 790000, "rew": 9808.6392, "rew_std": 822.0098, "Agent": "TD3"}, {"env_step": 795000, "rew": 9754.6227, "rew_std": 831.5913, "Agent": "TD3"}, {"env_step": 800000, "rew": 9778.1098, "rew_std": 763.7581, "Agent": "TD3"}, {"env_step": 805000, "rew": 9825.7902, "rew_std": 813.3548, "Agent": "TD3"}, {"env_step": 810000, "rew": 9798.4076, "rew_std": 799.6761, "Agent": "TD3"}, {"env_step": 815000, "rew": 9804.338, "rew_std": 798.6376, "Agent": "TD3"}, {"env_step": 820000, "rew": 9793.0963, "rew_std": 809.0504, "Agent": "TD3"}, {"env_step": 825000, "rew": 9821.5347, "rew_std": 811.4409, "Agent": "TD3"}, {"env_step": 830000, "rew": 9762.1984, "rew_std": 753.4929, "Agent": "TD3"}, {"env_step": 835000, "rew": 9852.6895, "rew_std": 841.7706, "Agent": "TD3"}, {"env_step": 840000, "rew": 9872.1575, "rew_std": 756.2683, "Agent": "TD3"}, {"env_step": 845000, "rew": 9909.5908, "rew_std": 837.792, "Agent": "TD3"}, {"env_step": 850000, "rew": 9916.1449, "rew_std": 807.2152, "Agent": "TD3"}, {"env_step": 855000, "rew": 9883.2548, "rew_std": 776.8632, "Agent": "TD3"}, {"env_step": 860000, "rew": 9974.5868, "rew_std": 808.4498, "Agent": "TD3"}, {"env_step": 865000, "rew": 9928.346, "rew_std": 811.971, "Agent": "TD3"}, {"env_step": 870000, "rew": 9910.8146, "rew_std": 829.7343, "Agent": "TD3"}, {"env_step": 875000, "rew": 9915.3258, "rew_std": 716.3259, "Agent": "TD3"}, {"env_step": 880000, "rew": 9943.3313, "rew_std": 801.7854, "Agent": "TD3"}, {"env_step": 885000, "rew": 9973.9117, "rew_std": 815.8196, "Agent": "TD3"}, {"env_step": 890000, "rew": 10028.523, "rew_std": 810.603, "Agent": "TD3"}, {"env_step": 895000, "rew": 9988.4478, "rew_std": 830.4222, "Agent": "TD3"}, {"env_step": 900000, "rew": 10019.7384, "rew_std": 821.4592, "Agent": "TD3"}, {"env_step": 905000, "rew": 10014.3362, "rew_std": 800.811, "Agent": "TD3"}, {"env_step": 910000, "rew": 10115.0379, "rew_std": 802.7237, "Agent": "TD3"}, {"env_step": 915000, "rew": 10078.2624, "rew_std": 763.4506, "Agent": "TD3"}, {"env_step": 920000, "rew": 10025.5229, "rew_std": 706.419, "Agent": "TD3"}, {"env_step": 925000, "rew": 10137.1765, "rew_std": 784.5741, "Agent": "TD3"}, {"env_step": 930000, "rew": 10029.2503, "rew_std": 786.896, "Agent": "TD3"}, {"env_step": 935000, "rew": 10059.9907, "rew_std": 770.6038, "Agent": "TD3"}, {"env_step": 940000, "rew": 10080.8968, "rew_std": 868.2282, "Agent": "TD3"}, {"env_step": 945000, "rew": 10087.6062, "rew_std": 761.3788, "Agent": "TD3"}, {"env_step": 950000, "rew": 10130.8133, "rew_std": 817.9981, "Agent": "TD3"}, {"env_step": 955000, "rew": 10119.0627, "rew_std": 797.4048, "Agent": "TD3"}, {"env_step": 960000, "rew": 10117.4533, "rew_std": 731.4008, "Agent": "TD3"}, {"env_step": 965000, "rew": 10095.9303, "rew_std": 840.427, "Agent": "TD3"}, {"env_step": 970000, "rew": 10065.6145, "rew_std": 821.9565, "Agent": "TD3"}, {"env_step": 975000, "rew": 10168.2197, "rew_std": 772.3371, "Agent": "TD3"}, {"env_step": 980000, "rew": 10138.8102, "rew_std": 797.7195, "Agent": "TD3"}, {"env_step": 985000, "rew": 10201.1953, "rew_std": 772.7887, "Agent": "TD3"}, {"env_step": 990000, "rew": 10164.0714, "rew_std": 772.0474, "Agent": "TD3"}, {"env_step": 995000, "rew": 10166.9941, "rew_std": 782.1563, "Agent": "TD3"}, {"env_step": 1000000, "rew": 10126.7338, "rew_std": 691.8358, "Agent": "TD3"}, {"env_step": 1005000, "rew": 10178.6879, "rew_std": 730.893, "Agent": "TD3"}, {"env_step": 1010000, "rew": 10218.8769, "rew_std": 779.1047, "Agent": "TD3"}, {"env_step": 1015000, "rew": 10223.7908, "rew_std": 805.2236, "Agent": "TD3"}, {"env_step": 1020000, "rew": 10283.0535, "rew_std": 840.6199, "Agent": "TD3"}, {"env_step": 1025000, "rew": 10234.8471, "rew_std": 737.6595, "Agent": "TD3"}, {"env_step": 1030000, "rew": 10276.3837, "rew_std": 851.1605, "Agent": "TD3"}, {"env_step": 1035000, "rew": 10326.8339, "rew_std": 794.7202, "Agent": "TD3"}, {"env_step": 1040000, "rew": 10296.1702, "rew_std": 756.8565, "Agent": "TD3"}, {"env_step": 1045000, "rew": 10303.7155, "rew_std": 793.3612, "Agent": "TD3"}, {"env_step": 1050000, "rew": 10323.1621, "rew_std": 822.8054, "Agent": "TD3"}, {"env_step": 1055000, "rew": 10317.0148, "rew_std": 815.1317, "Agent": "TD3"}, {"env_step": 1060000, "rew": 10384.3829, "rew_std": 792.7379, "Agent": "TD3"}, {"env_step": 1065000, "rew": 10312.6868, "rew_std": 802.5368, "Agent": "TD3"}, {"env_step": 1070000, "rew": 10337.5452, "rew_std": 731.5095, "Agent": "TD3"}, {"env_step": 1075000, "rew": 10426.9081, "rew_std": 720.6897, "Agent": "TD3"}, {"env_step": 1080000, "rew": 10445.9585, "rew_std": 743.8478, "Agent": "TD3"}, {"env_step": 1085000, "rew": 10404.4356, "rew_std": 686.9511, "Agent": "TD3"}, {"env_step": 1090000, "rew": 10411.9082, "rew_std": 759.3062, "Agent": "TD3"}, {"env_step": 1095000, "rew": 10493.6734, "rew_std": 719.0233, "Agent": "TD3"}, {"env_step": 1100000, "rew": 10446.2659, "rew_std": 800.8762, "Agent": "TD3"}, {"env_step": 1105000, "rew": 10473.0588, "rew_std": 714.3254, "Agent": "TD3"}, {"env_step": 1110000, "rew": 10559.5191, "rew_std": 748.8673, "Agent": "TD3"}, {"env_step": 1115000, "rew": 10549.2806, "rew_std": 754.3475, "Agent": "TD3"}, {"env_step": 1120000, "rew": 10452.5229, "rew_std": 692.153, "Agent": "TD3"}, {"env_step": 1125000, "rew": 10562.384, "rew_std": 770.6165, "Agent": "TD3"}, {"env_step": 1130000, "rew": 10547.1885, "rew_std": 711.6438, "Agent": "TD3"}, {"env_step": 1135000, "rew": 10602.5228, "rew_std": 721.8553, "Agent": "TD3"}, {"env_step": 1140000, "rew": 10459.9711, "rew_std": 688.9873, "Agent": "TD3"}, {"env_step": 1145000, "rew": 10592.8877, "rew_std": 706.5442, "Agent": "TD3"}, {"env_step": 1150000, "rew": 10587.6289, "rew_std": 766.3566, "Agent": "TD3"}, {"env_step": 1155000, "rew": 10635.7845, "rew_std": 774.0688, "Agent": "TD3"}, {"env_step": 1160000, "rew": 10659.2155, "rew_std": 774.1428, "Agent": "TD3"}, {"env_step": 1165000, "rew": 10574.2337, "rew_std": 678.7509, "Agent": "TD3"}, {"env_step": 1170000, "rew": 10614.9555, "rew_std": 700.4832, "Agent": "TD3"}, {"env_step": 1175000, "rew": 10676.1137, "rew_std": 676.5039, "Agent": "TD3"}, {"env_step": 1180000, "rew": 10698.8282, "rew_std": 658.7235, "Agent": "TD3"}, {"env_step": 1185000, "rew": 10542.7353, "rew_std": 663.1433, "Agent": "TD3"}, {"env_step": 1190000, "rew": 10669.2207, "rew_std": 709.0098, "Agent": "TD3"}, {"env_step": 1195000, "rew": 10655.4834, "rew_std": 698.5363, "Agent": "TD3"}, {"env_step": 1200000, "rew": 10633.3746, "rew_std": 638.7168, "Agent": "TD3"}, {"env_step": 1205000, "rew": 10701.2624, "rew_std": 710.2126, "Agent": "TD3"}, {"env_step": 1210000, "rew": 10764.1783, "rew_std": 624.228, "Agent": "TD3"}, {"env_step": 1215000, "rew": 10750.3966, "rew_std": 695.4035, "Agent": "TD3"}, {"env_step": 1220000, "rew": 10837.0146, "rew_std": 677.4937, "Agent": "TD3"}, {"env_step": 1225000, "rew": 10737.5749, "rew_std": 714.6048, "Agent": "TD3"}, {"env_step": 1230000, "rew": 10771.3394, "rew_std": 627.9872, "Agent": "TD3"}, {"env_step": 1235000, "rew": 10858.5293, "rew_std": 689.6976, "Agent": "TD3"}, {"env_step": 1240000, "rew": 10797.6929, "rew_std": 668.7104, "Agent": "TD3"}, {"env_step": 1245000, "rew": 10868.2019, "rew_std": 696.346, "Agent": "TD3"}, {"env_step": 1250000, "rew": 10792.3989, "rew_std": 665.2522, "Agent": "TD3"}, {"env_step": 0, "rew": -239.2134, "rew_std": 26.5314, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": -130.9784, "rew_std": 17.5175, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": -48.2173, "rew_std": 19.3685, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": -52.4932, "rew_std": 35.6246, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": -65.4243, "rew_std": 29.0437, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": -72.0306, "rew_std": 36.0845, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 0.4784, "rew_std": 67.6205, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 13.6712, "rew_std": 101.5885, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 139.6784, "rew_std": 121.8181, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 130.5103, "rew_std": 191.4711, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 114.7512, "rew_std": 190.9939, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 68.9615, "rew_std": 121.306, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 109.9668, "rew_std": 138.3891, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 126.0045, "rew_std": 178.0439, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 204.6715, "rew_std": 161.6187, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 272.3794, "rew_std": 130.6516, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 363.4219, "rew_std": 141.1197, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 323.1122, "rew_std": 199.7319, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 336.5633, "rew_std": 202.8921, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 350.5812, "rew_std": 196.8854, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 371.6283, "rew_std": 190.2861, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 403.8344, "rew_std": 176.4811, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 429.8125, "rew_std": 182.3272, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 445.647, "rew_std": 156.3292, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 409.2769, "rew_std": 187.4834, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 399.6021, "rew_std": 222.1071, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 402.4893, "rew_std": 243.7293, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 436.1274, "rew_std": 245.7288, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 434.0936, "rew_std": 248.5055, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 422.6199, "rew_std": 266.891, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 458.7628, "rew_std": 234.5876, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 481.243, "rew_std": 243.8428, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 512.3078, "rew_std": 209.158, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 525.5006, "rew_std": 181.8258, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 532.0321, "rew_std": 198.5119, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 541.2009, "rew_std": 191.9939, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 552.9654, "rew_std": 191.0248, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 549.1181, "rew_std": 197.3171, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 604.0583, "rew_std": 174.7335, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 594.4701, "rew_std": 154.8017, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 606.9413, "rew_std": 156.8321, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 620.9988, "rew_std": 143.3749, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 634.8226, "rew_std": 140.0081, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 635.5886, "rew_std": 129.6849, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 641.4025, "rew_std": 119.5029, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 631.3879, "rew_std": 128.1176, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 657.6043, "rew_std": 124.8992, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 675.7489, "rew_std": 119.027, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 662.4531, "rew_std": 105.9602, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 666.6031, "rew_std": 103.0068, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 683.1362, "rew_std": 107.026, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 686.2614, "rew_std": 112.2725, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 696.8179, "rew_std": 98.897, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 702.4769, "rew_std": 94.8873, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 704.4676, "rew_std": 87.216, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 733.5609, "rew_std": 85.4199, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 739.9737, "rew_std": 74.0321, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 727.4521, "rew_std": 62.8634, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 732.5071, "rew_std": 71.188, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 748.7167, "rew_std": 76.5575, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 737.4527, "rew_std": 72.1915, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 754.2162, "rew_std": 73.0255, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 756.587, "rew_std": 80.629, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 725.8417, "rew_std": 120.566, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 769.9105, "rew_std": 63.3313, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 755.0456, "rew_std": 47.4848, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 780.3756, "rew_std": 56.5651, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 769.5733, "rew_std": 67.2945, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 781.3064, "rew_std": 72.9166, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 781.6407, "rew_std": 47.8687, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 798.3952, "rew_std": 72.5853, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 793.7055, "rew_std": 57.7114, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 788.6205, "rew_std": 65.4386, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 803.8613, "rew_std": 46.9137, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 782.8062, "rew_std": 58.0125, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 795.8051, "rew_std": 55.088, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 809.0786, "rew_std": 41.5371, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 812.1326, "rew_std": 50.8964, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 813.0989, "rew_std": 60.4955, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 810.6179, "rew_std": 52.8278, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 809.6877, "rew_std": 54.128, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 831.7716, "rew_std": 46.8229, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 831.0148, "rew_std": 49.9816, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 819.638, "rew_std": 65.2786, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 835.1732, "rew_std": 58.8964, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 849.7141, "rew_std": 45.4597, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 858.2384, "rew_std": 49.3522, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 862.0843, "rew_std": 47.91, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 855.118, "rew_std": 31.717, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 865.496, "rew_std": 51.6423, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 852.2358, "rew_std": 49.6403, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 846.0969, "rew_std": 29.3903, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 843.4356, "rew_std": 35.9265, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 876.8606, "rew_std": 36.6545, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 878.6943, "rew_std": 35.3836, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 883.9985, "rew_std": 40.9765, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 879.088, "rew_std": 36.9194, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 883.1086, "rew_std": 51.5751, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 878.5629, "rew_std": 51.4401, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 876.7223, "rew_std": 54.3786, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 881.5336, "rew_std": 83.5794, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 867.0418, "rew_std": 82.998, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 877.304, "rew_std": 75.1667, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 876.2122, "rew_std": 93.2066, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 822.7774, "rew_std": 179.4039, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 865.225, "rew_std": 95.6548, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 876.3886, "rew_std": 65.7255, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 901.4318, "rew_std": 44.2542, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 906.5281, "rew_std": 40.9878, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 902.8887, "rew_std": 42.6048, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 887.7884, "rew_std": 55.2236, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 890.9958, "rew_std": 45.3819, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 905.9487, "rew_std": 59.0244, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 878.4631, "rew_std": 77.4708, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 918.9451, "rew_std": 68.617, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 912.5092, "rew_std": 56.8806, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 930.3603, "rew_std": 47.639, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 937.8539, "rew_std": 46.8265, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 933.9781, "rew_std": 54.7217, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 924.4348, "rew_std": 46.9608, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 932.5993, "rew_std": 61.1287, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 930.562, "rew_std": 39.1545, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 939.6507, "rew_std": 50.0547, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 931.6101, "rew_std": 64.34, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 893.6656, "rew_std": 91.2603, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 933.943, "rew_std": 51.9606, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 937.8593, "rew_std": 58.272, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 923.1785, "rew_std": 46.8948, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 919.5106, "rew_std": 79.6043, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 937.6189, "rew_std": 35.4825, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 941.5022, "rew_std": 39.9812, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 927.7056, "rew_std": 43.8473, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 955.5857, "rew_std": 40.0532, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 954.8072, "rew_std": 47.7404, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 968.9528, "rew_std": 47.641, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 927.58, "rew_std": 60.9435, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 951.3564, "rew_std": 35.3196, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 949.8772, "rew_std": 44.6866, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 923.3382, "rew_std": 59.9723, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 947.1497, "rew_std": 46.7235, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 930.2156, "rew_std": 96.1385, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 947.0682, "rew_std": 44.4635, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 913.4538, "rew_std": 106.4576, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 956.4173, "rew_std": 72.454, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 986.112, "rew_std": 53.2538, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 980.6774, "rew_std": 55.4501, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 969.6189, "rew_std": 45.7465, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 961.9398, "rew_std": 44.0191, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 977.3772, "rew_std": 46.2519, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 960.5113, "rew_std": 43.8153, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 975.5923, "rew_std": 42.7543, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 978.18, "rew_std": 60.7165, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 994.968, "rew_std": 52.9976, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 992.85, "rew_std": 53.1501, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 964.6797, "rew_std": 46.663, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 983.9115, "rew_std": 52.2566, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 990.3478, "rew_std": 40.05, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 997.0132, "rew_std": 41.0583, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 993.6661, "rew_std": 42.785, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 1011.8642, "rew_std": 27.5827, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 1005.24, "rew_std": 22.0347, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 995.1774, "rew_std": 38.7399, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 993.0942, "rew_std": 45.0712, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 1013.1125, "rew_std": 60.5238, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 996.6935, "rew_std": 44.7954, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 995.8926, "rew_std": 58.3237, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 1010.5929, "rew_std": 54.3951, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 994.6702, "rew_std": 69.0843, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 997.2196, "rew_std": 39.166, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 1016.5374, "rew_std": 54.9657, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 1017.5374, "rew_std": 62.1809, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 1015.6075, "rew_std": 53.5472, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 1016.8015, "rew_std": 52.6332, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 1002.2621, "rew_std": 57.4378, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 1001.0012, "rew_std": 100.386, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 1022.3522, "rew_std": 66.3868, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 1000.0438, "rew_std": 51.6201, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 1011.1049, "rew_std": 62.4932, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 1015.1676, "rew_std": 89.5522, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 1006.4157, "rew_std": 58.868, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 1021.2901, "rew_std": 48.5136, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 1034.2604, "rew_std": 51.6751, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 1012.779, "rew_std": 60.1441, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 1019.7712, "rew_std": 50.3584, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 1028.3674, "rew_std": 37.5526, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 1022.9339, "rew_std": 42.2359, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 1035.5652, "rew_std": 35.8611, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 1034.2733, "rew_std": 40.2398, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 1045.4148, "rew_std": 49.8297, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 1050.8877, "rew_std": 40.4739, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 1039.0886, "rew_std": 36.1023, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 1036.9562, "rew_std": 70.2645, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 1038.1224, "rew_std": 51.4148, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 1043.1975, "rew_std": 55.1165, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 1034.1112, "rew_std": 65.8918, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 1039.1232, "rew_std": 74.2882, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 1026.4448, "rew_std": 72.7191, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 1042.3366, "rew_std": 61.0111, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 1025.8535, "rew_std": 64.4098, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 1034.3692, "rew_std": 66.0265, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 1035.6472, "rew_std": 59.5942, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 1024.2567, "rew_std": 52.5294, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 1035.5613, "rew_std": 51.0109, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 1050.8728, "rew_std": 54.2495, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 1027.9969, "rew_std": 53.9087, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 1058.0868, "rew_std": 43.1176, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 1049.4824, "rew_std": 47.3149, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 1026.2656, "rew_std": 58.7652, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 1063.611, "rew_std": 62.7269, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 1013.5708, "rew_std": 87.5254, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 1059.3438, "rew_std": 46.8292, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 1021.049, "rew_std": 81.6385, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 1053.7262, "rew_std": 74.1989, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 1053.0535, "rew_std": 65.418, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 1059.707, "rew_std": 69.9458, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 1045.8224, "rew_std": 54.9453, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 1047.9718, "rew_std": 59.0243, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 1053.1456, "rew_std": 60.2588, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 1050.9961, "rew_std": 72.2672, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 1055.0399, "rew_std": 73.4961, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 1052.8888, "rew_std": 70.5037, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 1029.896, "rew_std": 92.459, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 1058.1352, "rew_std": 58.4981, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 1040.137, "rew_std": 86.8626, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 1048.5212, "rew_std": 58.2427, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 1056.9189, "rew_std": 56.9239, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 1066.5289, "rew_std": 56.7241, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 1039.9768, "rew_std": 69.6099, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 1055.0471, "rew_std": 48.4431, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 1073.3547, "rew_std": 54.2786, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 1078.4087, "rew_std": 56.8925, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 1062.771, "rew_std": 56.5096, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 1064.348, "rew_std": 46.8655, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 1069.0247, "rew_std": 53.9928, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 1095.3149, "rew_std": 56.0251, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 1059.7795, "rew_std": 89.3297, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 1075.7866, "rew_std": 48.5306, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 1070.4785, "rew_std": 57.9126, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 1067.7449, "rew_std": 45.6498, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 1068.3339, "rew_std": 51.5933, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 1073.2552, "rew_std": 45.2915, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 1086.6587, "rew_std": 51.2162, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 1078.313, "rew_std": 39.8316, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 1060.5985, "rew_std": 44.682, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 1075.5627, "rew_std": 50.3273, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 1072.449, "rew_std": 63.2418, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 1085.9426, "rew_std": 33.5946, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 1092.3983, "rew_std": 53.6555, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 1078.9839, "rew_std": 54.3774, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 1091.3667, "rew_std": 46.3437, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 1082.5875, "rew_std": 42.6033, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 1066.3451, "rew_std": 61.7616, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 1073.6454, "rew_std": 59.707, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 1063.3744, "rew_std": 71.0224, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 1090.047, "rew_std": 40.6139, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 1080.7565, "rew_std": 44.8726, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 1065.6765, "rew_std": 46.4016, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 1067.6488, "rew_std": 49.9414, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 1085.3441, "rew_std": 55.2402, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 1062.0563, "rew_std": 49.4121, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 1086.9089, "rew_std": 50.1225, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 1085.0331, "rew_std": 42.0211, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 1076.8434, "rew_std": 43.465, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 1097.6033, "rew_std": 44.2847, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 1105.4302, "rew_std": 43.7604, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 1088.2506, "rew_std": 37.5434, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 1080.3139, "rew_std": 45.7188, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 1084.8442, "rew_std": 47.4441, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 1077.7378, "rew_std": 59.542, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 1066.8771, "rew_std": 72.9645, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 1096.348, "rew_std": 52.8151, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 1071.0871, "rew_std": 50.5231, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 1091.951, "rew_std": 44.6643, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 1086.8091, "rew_std": 46.2969, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 1095.6318, "rew_std": 51.617, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 1064.6144, "rew_std": 70.4566, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 1097.0543, "rew_std": 45.3195, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 1104.6612, "rew_std": 42.8634, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 1098.8933, "rew_std": 38.3864, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 1086.6912, "rew_std": 50.3266, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 1102.2135, "rew_std": 70.933, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 1090.1486, "rew_std": 81.3128, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 1087.0612, "rew_std": 57.0418, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 1107.9893, "rew_std": 51.2113, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 1116.9207, "rew_std": 50.9583, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 1112.6254, "rew_std": 43.8869, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 1118.0138, "rew_std": 37.5083, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 1092.8679, "rew_std": 52.3159, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 1112.43, "rew_std": 43.5469, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 1109.6117, "rew_std": 53.1086, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 1091.1253, "rew_std": 55.2791, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 1103.3368, "rew_std": 47.0241, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 1117.9517, "rew_std": 45.6591, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 1106.9619, "rew_std": 41.4317, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 1115.1068, "rew_std": 55.2598, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 1122.0894, "rew_std": 35.4838, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 1127.6883, "rew_std": 46.4658, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 1112.8166, "rew_std": 41.8131, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 1115.7368, "rew_std": 53.6233, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 1095.7732, "rew_std": 39.6533, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 1120.5861, "rew_std": 41.3632, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 1082.4576, "rew_std": 92.7449, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 1129.3393, "rew_std": 45.1588, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 1107.1046, "rew_std": 57.317, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 1115.6161, "rew_std": 54.6329, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 1123.2624, "rew_std": 32.816, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 1127.7662, "rew_std": 38.7112, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 1122.9372, "rew_std": 35.7091, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 1115.9145, "rew_std": 40.5152, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 1113.5322, "rew_std": 40.1525, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 1136.2791, "rew_std": 35.7975, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 1113.7384, "rew_std": 35.8931, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 1121.8195, "rew_std": 42.9915, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 1130.7352, "rew_std": 35.1201, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 1125.1981, "rew_std": 40.9015, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 1118.2906, "rew_std": 48.4825, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 1089.7356, "rew_std": 58.9498, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 1115.0204, "rew_std": 53.2705, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 1121.7228, "rew_std": 48.332, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 1129.367, "rew_std": 35.2903, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 1118.8765, "rew_std": 36.8765, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 1113.9437, "rew_std": 69.7432, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 1120.8454, "rew_std": 33.3913, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 1113.0581, "rew_std": 56.4189, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 1120.8607, "rew_std": 33.265, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 1107.17, "rew_std": 51.0692, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 1123.9591, "rew_std": 39.8303, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 1132.0132, "rew_std": 53.0461, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 1138.7607, "rew_std": 38.8626, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 1125.9321, "rew_std": 35.3656, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 1121.423, "rew_std": 45.7195, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 1132.5021, "rew_std": 46.9729, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 1133.2431, "rew_std": 38.2374, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 1125.8592, "rew_std": 40.0745, "Agent": "REINFORCE"}, {"env_step": 0, "rew": -2.027, "rew_std": 0.7352, "Agent": "SAC"}, {"env_step": 5000, "rew": 10.1839, "rew_std": 23.2072, "Agent": "SAC"}, {"env_step": 10000, "rew": 865.359, "rew_std": 486.562, "Agent": "SAC"}, {"env_step": 15000, "rew": 1814.2922, "rew_std": 570.1082, "Agent": "SAC"}, {"env_step": 20000, "rew": 2641.1068, "rew_std": 503.2532, "Agent": "SAC"}, {"env_step": 25000, "rew": 3365.0157, "rew_std": 417.5691, "Agent": "SAC"}, {"env_step": 30000, "rew": 3525.4369, "rew_std": 501.063, "Agent": "SAC"}, {"env_step": 35000, "rew": 3983.1205, "rew_std": 279.2621, "Agent": "SAC"}, {"env_step": 40000, "rew": 4326.9325, "rew_std": 213.1473, "Agent": "SAC"}, {"env_step": 45000, "rew": 4605.0875, "rew_std": 269.9916, "Agent": "SAC"}, {"env_step": 50000, "rew": 4747.2399, "rew_std": 345.0121, "Agent": "SAC"}, {"env_step": 55000, "rew": 5083.2292, "rew_std": 380.5083, "Agent": "SAC"}, {"env_step": 60000, "rew": 5316.2064, "rew_std": 330.2907, "Agent": "SAC"}, {"env_step": 65000, "rew": 5496.9468, "rew_std": 418.5496, "Agent": "SAC"}, {"env_step": 70000, "rew": 5586.9485, "rew_std": 540.2148, "Agent": "SAC"}, {"env_step": 75000, "rew": 5851.4753, "rew_std": 371.89, "Agent": "SAC"}, {"env_step": 80000, "rew": 5929.2037, "rew_std": 454.7962, "Agent": "SAC"}, {"env_step": 85000, "rew": 6106.3958, "rew_std": 438.9816, "Agent": "SAC"}, {"env_step": 90000, "rew": 6212.7888, "rew_std": 437.2369, "Agent": "SAC"}, {"env_step": 95000, "rew": 6187.6082, "rew_std": 511.4287, "Agent": "SAC"}, {"env_step": 100000, "rew": 6514.6227, "rew_std": 514.2304, "Agent": "SAC"}, {"env_step": 105000, "rew": 6485.9809, "rew_std": 597.6332, "Agent": "SAC"}, {"env_step": 110000, "rew": 6595.3192, "rew_std": 550.9856, "Agent": "SAC"}, {"env_step": 115000, "rew": 6751.1698, "rew_std": 579.1543, "Agent": "SAC"}, {"env_step": 120000, "rew": 6801.2745, "rew_std": 579.1199, "Agent": "SAC"}, {"env_step": 125000, "rew": 7076.524, "rew_std": 669.0167, "Agent": "SAC"}, {"env_step": 130000, "rew": 7088.5351, "rew_std": 673.049, "Agent": "SAC"}, {"env_step": 135000, "rew": 7229.5772, "rew_std": 688.2214, "Agent": "SAC"}, {"env_step": 140000, "rew": 7198.8854, "rew_std": 665.0043, "Agent": "SAC"}, {"env_step": 145000, "rew": 7391.4168, "rew_std": 768.3948, "Agent": "SAC"}, {"env_step": 150000, "rew": 7464.8962, "rew_std": 720.8476, "Agent": "SAC"}, {"env_step": 155000, "rew": 7437.4415, "rew_std": 763.1268, "Agent": "SAC"}, {"env_step": 160000, "rew": 7577.3921, "rew_std": 815.7664, "Agent": "SAC"}, {"env_step": 165000, "rew": 7730.9681, "rew_std": 811.9207, "Agent": "SAC"}, {"env_step": 170000, "rew": 7653.3391, "rew_std": 694.4047, "Agent": "SAC"}, {"env_step": 175000, "rew": 7943.5144, "rew_std": 887.9127, "Agent": "SAC"}, {"env_step": 180000, "rew": 7825.5208, "rew_std": 918.1944, "Agent": "SAC"}, {"env_step": 185000, "rew": 8028.0037, "rew_std": 881.683, "Agent": "SAC"}, {"env_step": 190000, "rew": 7877.3779, "rew_std": 762.8448, "Agent": "SAC"}, {"env_step": 195000, "rew": 8144.8266, "rew_std": 1004.9139, "Agent": "SAC"}, {"env_step": 200000, "rew": 8207.6336, "rew_std": 928.3063, "Agent": "SAC"}, {"env_step": 205000, "rew": 7962.9357, "rew_std": 1050.1757, "Agent": "SAC"}, {"env_step": 210000, "rew": 8309.562, "rew_std": 986.6001, "Agent": "SAC"}, {"env_step": 215000, "rew": 8434.306, "rew_std": 1014.6172, "Agent": "SAC"}, {"env_step": 220000, "rew": 8270.1339, "rew_std": 964.6572, "Agent": "SAC"}, {"env_step": 225000, "rew": 8415.4762, "rew_std": 917.3119, "Agent": "SAC"}, {"env_step": 230000, "rew": 8533.957, "rew_std": 987.645, "Agent": "SAC"}, {"env_step": 235000, "rew": 8591.5228, "rew_std": 1112.037, "Agent": "SAC"}, {"env_step": 240000, "rew": 8707.7558, "rew_std": 1031.5746, "Agent": "SAC"}, {"env_step": 245000, "rew": 8759.7748, "rew_std": 1046.6268, "Agent": "SAC"}, {"env_step": 250000, "rew": 8836.3744, "rew_std": 1070.2071, "Agent": "SAC"}, {"env_step": 255000, "rew": 8835.3932, "rew_std": 1125.7859, "Agent": "SAC"}, {"env_step": 260000, "rew": 8948.6225, "rew_std": 1104.4205, "Agent": "SAC"}, {"env_step": 265000, "rew": 8910.7138, "rew_std": 967.2416, "Agent": "SAC"}, {"env_step": 270000, "rew": 8892.1686, "rew_std": 1144.4755, "Agent": "SAC"}, {"env_step": 275000, "rew": 8966.5011, "rew_std": 1009.1316, "Agent": "SAC"}, {"env_step": 280000, "rew": 9011.7319, "rew_std": 1003.8617, "Agent": "SAC"}, {"env_step": 285000, "rew": 9067.2721, "rew_std": 1095.6016, "Agent": "SAC"}, {"env_step": 290000, "rew": 9150.2293, "rew_std": 1051.4986, "Agent": "SAC"}, {"env_step": 295000, "rew": 8819.8506, "rew_std": 1224.7711, "Agent": "SAC"}, {"env_step": 300000, "rew": 9059.2562, "rew_std": 1051.4143, "Agent": "SAC"}, {"env_step": 305000, "rew": 9241.608, "rew_std": 972.1405, "Agent": "SAC"}, {"env_step": 310000, "rew": 9317.492, "rew_std": 955.1288, "Agent": "SAC"}, {"env_step": 315000, "rew": 9108.5728, "rew_std": 933.4934, "Agent": "SAC"}, {"env_step": 320000, "rew": 9338.11, "rew_std": 807.6986, "Agent": "SAC"}, {"env_step": 325000, "rew": 9341.4086, "rew_std": 952.2938, "Agent": "SAC"}, {"env_step": 330000, "rew": 9356.795, "rew_std": 887.4584, "Agent": "SAC"}, {"env_step": 335000, "rew": 9481.7274, "rew_std": 942.1804, "Agent": "SAC"}, {"env_step": 340000, "rew": 9367.992, "rew_std": 1002.2366, "Agent": "SAC"}, {"env_step": 345000, "rew": 9424.7869, "rew_std": 793.3956, "Agent": "SAC"}, {"env_step": 350000, "rew": 9521.2021, "rew_std": 945.0578, "Agent": "SAC"}, {"env_step": 355000, "rew": 9465.8035, "rew_std": 986.819, "Agent": "SAC"}, {"env_step": 360000, "rew": 9631.8073, "rew_std": 901.8403, "Agent": "SAC"}, {"env_step": 365000, "rew": 9666.9302, "rew_std": 688.4103, "Agent": "SAC"}, {"env_step": 370000, "rew": 9845.7185, "rew_std": 776.1784, "Agent": "SAC"}, {"env_step": 375000, "rew": 9783.6146, "rew_std": 748.8536, "Agent": "SAC"}, {"env_step": 380000, "rew": 9743.993, "rew_std": 864.4312, "Agent": "SAC"}, {"env_step": 385000, "rew": 9748.2177, "rew_std": 755.897, "Agent": "SAC"}, {"env_step": 390000, "rew": 9794.1282, "rew_std": 749.9596, "Agent": "SAC"}, {"env_step": 395000, "rew": 9691.9995, "rew_std": 855.6781, "Agent": "SAC"}, {"env_step": 400000, "rew": 9908.5217, "rew_std": 901.3128, "Agent": "SAC"}, {"env_step": 405000, "rew": 10051.019, "rew_std": 774.8568, "Agent": "SAC"}, {"env_step": 410000, "rew": 10034.7663, "rew_std": 815.4708, "Agent": "SAC"}, {"env_step": 415000, "rew": 10157.1511, "rew_std": 724.3571, "Agent": "SAC"}, {"env_step": 420000, "rew": 10016.6583, "rew_std": 830.1947, "Agent": "SAC"}, {"env_step": 425000, "rew": 9990.6593, "rew_std": 783.9429, "Agent": "SAC"}, {"env_step": 430000, "rew": 9951.3972, "rew_std": 816.0467, "Agent": "SAC"}, {"env_step": 435000, "rew": 10314.0172, "rew_std": 750.6577, "Agent": "SAC"}, {"env_step": 440000, "rew": 10258.7498, "rew_std": 753.6217, "Agent": "SAC"}, {"env_step": 445000, "rew": 10039.4467, "rew_std": 1114.8295, "Agent": "SAC"}, {"env_step": 450000, "rew": 10256.0898, "rew_std": 724.7449, "Agent": "SAC"}, {"env_step": 455000, "rew": 10255.1356, "rew_std": 715.2809, "Agent": "SAC"}, {"env_step": 460000, "rew": 10313.6543, "rew_std": 670.6573, "Agent": "SAC"}, {"env_step": 465000, "rew": 10239.7386, "rew_std": 699.8731, "Agent": "SAC"}, {"env_step": 470000, "rew": 10444.677, "rew_std": 721.1596, "Agent": "SAC"}, {"env_step": 475000, "rew": 10348.6424, "rew_std": 875.3533, "Agent": "SAC"}, {"env_step": 480000, "rew": 9822.9344, "rew_std": 995.0004, "Agent": "SAC"}, {"env_step": 485000, "rew": 10373.6868, "rew_std": 676.0692, "Agent": "SAC"}, {"env_step": 490000, "rew": 10464.7314, "rew_std": 783.7438, "Agent": "SAC"}, {"env_step": 495000, "rew": 10477.8849, "rew_std": 749.5457, "Agent": "SAC"}, {"env_step": 500000, "rew": 10409.97, "rew_std": 696.7419, "Agent": "SAC"}, {"env_step": 505000, "rew": 10344.591, "rew_std": 754.885, "Agent": "SAC"}, {"env_step": 510000, "rew": 10585.7676, "rew_std": 798.5526, "Agent": "SAC"}, {"env_step": 515000, "rew": 10509.9652, "rew_std": 755.3173, "Agent": "SAC"}, {"env_step": 520000, "rew": 10578.6697, "rew_std": 767.8139, "Agent": "SAC"}, {"env_step": 525000, "rew": 10731.3679, "rew_std": 702.0967, "Agent": "SAC"}, {"env_step": 530000, "rew": 10715.2787, "rew_std": 816.2541, "Agent": "SAC"}, {"env_step": 535000, "rew": 10434.4037, "rew_std": 903.8272, "Agent": "SAC"}, {"env_step": 540000, "rew": 10402.0162, "rew_std": 865.098, "Agent": "SAC"}, {"env_step": 545000, "rew": 10469.6772, "rew_std": 1201.1587, "Agent": "SAC"}, {"env_step": 550000, "rew": 10784.2863, "rew_std": 756.5986, "Agent": "SAC"}, {"env_step": 555000, "rew": 10736.8056, "rew_std": 772.8018, "Agent": "SAC"}, {"env_step": 560000, "rew": 10693.0171, "rew_std": 808.7638, "Agent": "SAC"}, {"env_step": 565000, "rew": 10771.5095, "rew_std": 861.7875, "Agent": "SAC"}, {"env_step": 570000, "rew": 10681.0633, "rew_std": 873.4222, "Agent": "SAC"}, {"env_step": 575000, "rew": 10807.2527, "rew_std": 814.9743, "Agent": "SAC"}, {"env_step": 580000, "rew": 10937.5397, "rew_std": 819.6207, "Agent": "SAC"}, {"env_step": 585000, "rew": 10878.7778, "rew_std": 897.3742, "Agent": "SAC"}, {"env_step": 590000, "rew": 10909.0009, "rew_std": 790.7898, "Agent": "SAC"}, {"env_step": 595000, "rew": 10864.504, "rew_std": 839.9366, "Agent": "SAC"}, {"env_step": 600000, "rew": 10834.5523, "rew_std": 798.3907, "Agent": "SAC"}, {"env_step": 605000, "rew": 10965.6832, "rew_std": 782.3083, "Agent": "SAC"}, {"env_step": 610000, "rew": 10670.7502, "rew_std": 1000.5134, "Agent": "SAC"}, {"env_step": 615000, "rew": 11034.147, "rew_std": 770.7826, "Agent": "SAC"}, {"env_step": 620000, "rew": 10885.1786, "rew_std": 846.6412, "Agent": "SAC"}, {"env_step": 625000, "rew": 11171.5709, "rew_std": 842.4588, "Agent": "SAC"}, {"env_step": 630000, "rew": 11093.6177, "rew_std": 853.805, "Agent": "SAC"}, {"env_step": 635000, "rew": 11108.4159, "rew_std": 817.3521, "Agent": "SAC"}, {"env_step": 640000, "rew": 10876.0314, "rew_std": 843.1665, "Agent": "SAC"}, {"env_step": 645000, "rew": 11164.6113, "rew_std": 871.3397, "Agent": "SAC"}, {"env_step": 650000, "rew": 10951.5324, "rew_std": 844.1223, "Agent": "SAC"}, {"env_step": 655000, "rew": 10930.1218, "rew_std": 751.7118, "Agent": "SAC"}, {"env_step": 660000, "rew": 11156.2704, "rew_std": 864.4117, "Agent": "SAC"}, {"env_step": 665000, "rew": 11292.937, "rew_std": 857.9847, "Agent": "SAC"}, {"env_step": 670000, "rew": 11120.3012, "rew_std": 900.4298, "Agent": "SAC"}, {"env_step": 675000, "rew": 11238.3806, "rew_std": 799.2015, "Agent": "SAC"}, {"env_step": 680000, "rew": 11199.6556, "rew_std": 869.3494, "Agent": "SAC"}, {"env_step": 685000, "rew": 11196.8285, "rew_std": 1142.7087, "Agent": "SAC"}, {"env_step": 690000, "rew": 11376.8737, "rew_std": 843.3762, "Agent": "SAC"}, {"env_step": 695000, "rew": 11250.9709, "rew_std": 832.8242, "Agent": "SAC"}, {"env_step": 700000, "rew": 11357.1604, "rew_std": 904.5123, "Agent": "SAC"}, {"env_step": 705000, "rew": 11167.0614, "rew_std": 878.1416, "Agent": "SAC"}, {"env_step": 710000, "rew": 11142.2148, "rew_std": 849.0947, "Agent": "SAC"}, {"env_step": 715000, "rew": 11354.5586, "rew_std": 880.9652, "Agent": "SAC"}, {"env_step": 720000, "rew": 11292.1365, "rew_std": 855.3787, "Agent": "SAC"}, {"env_step": 725000, "rew": 11397.1391, "rew_std": 849.8348, "Agent": "SAC"}, {"env_step": 730000, "rew": 11363.1654, "rew_std": 865.1339, "Agent": "SAC"}, {"env_step": 735000, "rew": 11401.6934, "rew_std": 985.0648, "Agent": "SAC"}, {"env_step": 740000, "rew": 11457.9921, "rew_std": 882.5772, "Agent": "SAC"}, {"env_step": 745000, "rew": 11263.8964, "rew_std": 861.9337, "Agent": "SAC"}, {"env_step": 750000, "rew": 11329.132, "rew_std": 870.3124, "Agent": "SAC"}, {"env_step": 755000, "rew": 11432.5841, "rew_std": 878.3916, "Agent": "SAC"}, {"env_step": 760000, "rew": 11366.4875, "rew_std": 1066.7255, "Agent": "SAC"}, {"env_step": 765000, "rew": 11235.2494, "rew_std": 1250.3021, "Agent": "SAC"}, {"env_step": 770000, "rew": 11393.2447, "rew_std": 956.0431, "Agent": "SAC"}, {"env_step": 775000, "rew": 11499.3649, "rew_std": 903.8219, "Agent": "SAC"}, {"env_step": 780000, "rew": 11377.0247, "rew_std": 857.1325, "Agent": "SAC"}, {"env_step": 785000, "rew": 11420.9959, "rew_std": 945.2315, "Agent": "SAC"}, {"env_step": 790000, "rew": 11381.5919, "rew_std": 870.4013, "Agent": "SAC"}, {"env_step": 795000, "rew": 11440.576, "rew_std": 898.4534, "Agent": "SAC"}, {"env_step": 800000, "rew": 11676.8494, "rew_std": 971.5681, "Agent": "SAC"}, {"env_step": 805000, "rew": 11607.9284, "rew_std": 904.6303, "Agent": "SAC"}, {"env_step": 810000, "rew": 11336.3882, "rew_std": 967.6672, "Agent": "SAC"}, {"env_step": 815000, "rew": 11037.0411, "rew_std": 1891.8502, "Agent": "SAC"}, {"env_step": 820000, "rew": 11702.6572, "rew_std": 930.5494, "Agent": "SAC"}, {"env_step": 825000, "rew": 11571.8939, "rew_std": 964.7258, "Agent": "SAC"}, {"env_step": 830000, "rew": 11714.3621, "rew_std": 953.5695, "Agent": "SAC"}, {"env_step": 835000, "rew": 11484.7875, "rew_std": 919.6083, "Agent": "SAC"}, {"env_step": 840000, "rew": 11653.8103, "rew_std": 892.0375, "Agent": "SAC"}, {"env_step": 845000, "rew": 11684.4042, "rew_std": 866.6908, "Agent": "SAC"}, {"env_step": 850000, "rew": 11681.3375, "rew_std": 961.4558, "Agent": "SAC"}, {"env_step": 855000, "rew": 11587.8436, "rew_std": 933.4399, "Agent": "SAC"}, {"env_step": 860000, "rew": 11661.2521, "rew_std": 1040.2257, "Agent": "SAC"}, {"env_step": 865000, "rew": 11488.6788, "rew_std": 1063.185, "Agent": "SAC"}, {"env_step": 870000, "rew": 11540.2953, "rew_std": 1037.9443, "Agent": "SAC"}, {"env_step": 875000, "rew": 11841.9591, "rew_std": 963.0978, "Agent": "SAC"}, {"env_step": 880000, "rew": 11793.1006, "rew_std": 896.7818, "Agent": "SAC"}, {"env_step": 885000, "rew": 11874.787, "rew_std": 980.7893, "Agent": "SAC"}, {"env_step": 890000, "rew": 11648.9695, "rew_std": 905.3032, "Agent": "SAC"}, {"env_step": 895000, "rew": 11912.3981, "rew_std": 944.7161, "Agent": "SAC"}, {"env_step": 900000, "rew": 12012.0246, "rew_std": 1032.0492, "Agent": "SAC"}, {"env_step": 905000, "rew": 11748.9588, "rew_std": 961.4382, "Agent": "SAC"}, {"env_step": 910000, "rew": 11786.2655, "rew_std": 1031.0671, "Agent": "SAC"}, {"env_step": 915000, "rew": 11219.5542, "rew_std": 1884.3568, "Agent": "SAC"}, {"env_step": 920000, "rew": 11846.4572, "rew_std": 1007.202, "Agent": "SAC"}, {"env_step": 925000, "rew": 11506.1745, "rew_std": 1096.2194, "Agent": "SAC"}, {"env_step": 930000, "rew": 11861.6563, "rew_std": 1074.5994, "Agent": "SAC"}, {"env_step": 935000, "rew": 11753.2089, "rew_std": 1013.6127, "Agent": "SAC"}, {"env_step": 940000, "rew": 11921.9789, "rew_std": 939.7152, "Agent": "SAC"}, {"env_step": 945000, "rew": 11950.4468, "rew_std": 949.9662, "Agent": "SAC"}, {"env_step": 950000, "rew": 12028.8625, "rew_std": 1032.3731, "Agent": "SAC"}, {"env_step": 955000, "rew": 11937.5016, "rew_std": 957.3345, "Agent": "SAC"}, {"env_step": 960000, "rew": 11984.8677, "rew_std": 1016.5514, "Agent": "SAC"}, {"env_step": 965000, "rew": 11962.7994, "rew_std": 997.6641, "Agent": "SAC"}, {"env_step": 970000, "rew": 12027.9757, "rew_std": 941.3748, "Agent": "SAC"}, {"env_step": 975000, "rew": 11939.0175, "rew_std": 999.1897, "Agent": "SAC"}, {"env_step": 980000, "rew": 11913.8985, "rew_std": 916.6498, "Agent": "SAC"}, {"env_step": 985000, "rew": 11802.1434, "rew_std": 1129.3786, "Agent": "SAC"}, {"env_step": 990000, "rew": 12138.7987, "rew_std": 1049.3246, "Agent": "SAC"}, {"env_step": 995000, "rew": 12130.1697, "rew_std": 993.185, "Agent": "SAC"}, {"env_step": 1000000, "rew": 12121.8566, "rew_std": 1006.2108, "Agent": "SAC"}, {"env_step": 1005000, "rew": 11942.5856, "rew_std": 991.2353, "Agent": "SAC"}, {"env_step": 1010000, "rew": 12005.1579, "rew_std": 1045.1113, "Agent": "SAC"}, {"env_step": 1015000, "rew": 12041.7859, "rew_std": 998.4825, "Agent": "SAC"}, {"env_step": 1020000, "rew": 12013.6874, "rew_std": 1026.4441, "Agent": "SAC"}, {"env_step": 1025000, "rew": 12065.7275, "rew_std": 1012.3839, "Agent": "SAC"}, {"env_step": 1030000, "rew": 11714.3521, "rew_std": 1212.8575, "Agent": "SAC"}, {"env_step": 1035000, "rew": 12218.3614, "rew_std": 1082.4594, "Agent": "SAC"}, {"env_step": 1040000, "rew": 12184.5401, "rew_std": 1020.1823, "Agent": "SAC"}, {"env_step": 1045000, "rew": 12244.2109, "rew_std": 1030.6247, "Agent": "SAC"}, {"env_step": 1050000, "rew": 12202.9869, "rew_std": 1078.7199, "Agent": "SAC"}, {"env_step": 1055000, "rew": 12239.3944, "rew_std": 1019.3269, "Agent": "SAC"}, {"env_step": 1060000, "rew": 11997.9335, "rew_std": 914.4304, "Agent": "SAC"}, {"env_step": 1065000, "rew": 12149.6644, "rew_std": 893.8064, "Agent": "SAC"}, {"env_step": 1070000, "rew": 12175.7625, "rew_std": 1044.152, "Agent": "SAC"}, {"env_step": 1075000, "rew": 12346.2323, "rew_std": 1005.64, "Agent": "SAC"}, {"env_step": 1080000, "rew": 12362.0626, "rew_std": 1034.2557, "Agent": "SAC"}, {"env_step": 1085000, "rew": 12180.2346, "rew_std": 1023.6408, "Agent": "SAC"}, {"env_step": 1090000, "rew": 12104.2195, "rew_std": 1141.1273, "Agent": "SAC"}, {"env_step": 1095000, "rew": 12191.2541, "rew_std": 1113.5694, "Agent": "SAC"}, {"env_step": 1100000, "rew": 12395.9566, "rew_std": 952.733, "Agent": "SAC"}, {"env_step": 1105000, "rew": 12347.7701, "rew_std": 801.054, "Agent": "SAC"}, {"env_step": 1110000, "rew": 12235.5543, "rew_std": 1035.2947, "Agent": "SAC"}, {"env_step": 1115000, "rew": 12449.6886, "rew_std": 994.0012, "Agent": "SAC"}, {"env_step": 1120000, "rew": 12209.3594, "rew_std": 855.504, "Agent": "SAC"}, {"env_step": 1125000, "rew": 12242.4778, "rew_std": 958.1728, "Agent": "SAC"}, {"env_step": 1130000, "rew": 12435.6339, "rew_std": 713.4702, "Agent": "SAC"}, {"env_step": 1135000, "rew": 12379.179, "rew_std": 955.365, "Agent": "SAC"}, {"env_step": 1140000, "rew": 12235.5068, "rew_std": 1268.6864, "Agent": "SAC"}, {"env_step": 1145000, "rew": 12097.1035, "rew_std": 873.944, "Agent": "SAC"}, {"env_step": 1150000, "rew": 12531.4431, "rew_std": 932.6429, "Agent": "SAC"}, {"env_step": 1155000, "rew": 12377.1813, "rew_std": 815.1965, "Agent": "SAC"}, {"env_step": 1160000, "rew": 12598.7106, "rew_std": 843.0569, "Agent": "SAC"}, {"env_step": 1165000, "rew": 12420.8783, "rew_std": 869.0023, "Agent": "SAC"}, {"env_step": 1170000, "rew": 12546.8189, "rew_std": 872.5977, "Agent": "SAC"}, {"env_step": 1175000, "rew": 12338.7278, "rew_std": 934.1012, "Agent": "SAC"}, {"env_step": 1180000, "rew": 12441.9147, "rew_std": 970.1274, "Agent": "SAC"}, {"env_step": 1185000, "rew": 12395.7239, "rew_std": 856.8003, "Agent": "SAC"}, {"env_step": 1190000, "rew": 12693.0426, "rew_std": 841.1914, "Agent": "SAC"}, {"env_step": 1195000, "rew": 12438.0021, "rew_std": 1017.4289, "Agent": "SAC"}, {"env_step": 1200000, "rew": 12248.8422, "rew_std": 860.0051, "Agent": "SAC"}, {"env_step": 1205000, "rew": 12643.7048, "rew_std": 952.921, "Agent": "SAC"}, {"env_step": 1210000, "rew": 12449.039, "rew_std": 1083.0253, "Agent": "SAC"}, {"env_step": 1215000, "rew": 12576.7585, "rew_std": 913.4922, "Agent": "SAC"}, {"env_step": 1220000, "rew": 12584.8301, "rew_std": 883.0901, "Agent": "SAC"}, {"env_step": 1225000, "rew": 12716.9272, "rew_std": 996.5454, "Agent": "SAC"}, {"env_step": 1230000, "rew": 12436.8757, "rew_std": 882.0322, "Agent": "SAC"}, {"env_step": 1235000, "rew": 12590.1792, "rew_std": 886.9334, "Agent": "SAC"}, {"env_step": 1240000, "rew": 12652.7922, "rew_std": 932.0824, "Agent": "SAC"}, {"env_step": 1245000, "rew": 12458.9671, "rew_std": 1062.3939, "Agent": "SAC"}, {"env_step": 1250000, "rew": 12533.7516, "rew_std": 859.9165, "Agent": "SAC"}, {"env_step": 0, "rew": -269.0138, "rew_std": 20.4789, "Agent": "TRPO"}, {"env_step": 30720, "rew": -75.8476, "rew_std": 40.7319, "Agent": "TRPO"}, {"env_step": 61440, "rew": 118.8494, "rew_std": 70.2244, "Agent": "TRPO"}, {"env_step": 92160, "rew": 364.9657, "rew_std": 116.1403, "Agent": "TRPO"}, {"env_step": 122880, "rew": 630.9174, "rew_std": 220.7665, "Agent": "TRPO"}, {"env_step": 153600, "rew": 949.9552, "rew_std": 360.9975, "Agent": "TRPO"}, {"env_step": 184320, "rew": 1331.3596, "rew_std": 500.4918, "Agent": "TRPO"}, {"env_step": 215040, "rew": 1679.6014, "rew_std": 589.2362, "Agent": "TRPO"}, {"env_step": 245760, "rew": 2028.546, "rew_std": 727.1721, "Agent": "TRPO"}, {"env_step": 276480, "rew": 2256.0638, "rew_std": 860.3888, "Agent": "TRPO"}, {"env_step": 307200, "rew": 2601.4536, "rew_std": 799.4256, "Agent": "TRPO"}, {"env_step": 337920, "rew": 2822.262, "rew_std": 864.365, "Agent": "TRPO"}, {"env_step": 368640, "rew": 2958.2152, "rew_std": 890.044, "Agent": "TRPO"}, {"env_step": 399360, "rew": 3122.42, "rew_std": 885.6809, "Agent": "TRPO"}, {"env_step": 430080, "rew": 3221.8895, "rew_std": 799.139, "Agent": "TRPO"}, {"env_step": 460800, "rew": 3470.8979, "rew_std": 771.6672, "Agent": "TRPO"}, {"env_step": 491520, "rew": 3589.9087, "rew_std": 788.0406, "Agent": "TRPO"}, {"env_step": 522240, "rew": 3604.1879, "rew_std": 879.1726, "Agent": "TRPO"}, {"env_step": 552960, "rew": 3781.7636, "rew_std": 763.628, "Agent": "TRPO"}, {"env_step": 583680, "rew": 3771.7911, "rew_std": 857.4732, "Agent": "TRPO"}, {"env_step": 614400, "rew": 3918.9384, "rew_std": 813.178, "Agent": "TRPO"}, {"env_step": 645120, "rew": 3831.2216, "rew_std": 683.7742, "Agent": "TRPO"}, {"env_step": 675840, "rew": 3787.9915, "rew_std": 705.263, "Agent": "TRPO"}, {"env_step": 706560, "rew": 4062.4776, "rew_std": 654.6117, "Agent": "TRPO"}, {"env_step": 737280, "rew": 4163.2384, "rew_std": 684.7851, "Agent": "TRPO"}, {"env_step": 768000, "rew": 4174.8406, "rew_std": 629.7946, "Agent": "TRPO"}, {"env_step": 798720, "rew": 4074.9109, "rew_std": 660.3338, "Agent": "TRPO"}, {"env_step": 829440, "rew": 3946.6171, "rew_std": 649.9162, "Agent": "TRPO"}, {"env_step": 860160, "rew": 4383.0311, "rew_std": 699.1061, "Agent": "TRPO"}, {"env_step": 890880, "rew": 4322.1978, "rew_std": 633.054, "Agent": "TRPO"}, {"env_step": 921600, "rew": 4120.6806, "rew_std": 832.5398, "Agent": "TRPO"}, {"env_step": 952320, "rew": 4349.8712, "rew_std": 547.033, "Agent": "TRPO"}, {"env_step": 983040, "rew": 4402.5787, "rew_std": 1053.7237, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 4526.9356, "rew_std": 603.0703, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 4793.7482, "rew_std": 606.3231, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 4516.2141, "rew_std": 579.7988, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 4453.5164, "rew_std": 800.1863, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 4630.0231, "rew_std": 597.8511, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 4652.3804, "rew_std": 579.6711, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 4169.8088, "rew_std": 857.9307, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 4266.6013, "rew_std": 864.7216, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 4894.7608, "rew_std": 543.0844, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 4754.3905, "rew_std": 789.3097, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 4576.833, "rew_std": 601.6164, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 4940.4867, "rew_std": 648.3332, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 5076.2226, "rew_std": 599.6275, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 4756.491, "rew_std": 708.1688, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 5068.1599, "rew_std": 638.463, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 5187.4496, "rew_std": 631.2651, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 4823.9084, "rew_std": 933.0163, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 4975.8632, "rew_std": 601.5036, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 4814.2276, "rew_std": 1317.8236, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 4822.302, "rew_std": 691.5942, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 4603.7932, "rew_std": 574.1043, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 4858.2699, "rew_std": 517.2126, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 5034.7999, "rew_std": 676.5515, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 4979.1784, "rew_std": 771.1231, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 5213.5581, "rew_std": 645.344, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 5076.3158, "rew_std": 722.6969, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 5066.8979, "rew_std": 552.8654, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 5264.7166, "rew_std": 690.4721, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 5484.2208, "rew_std": 512.12, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 5298.097, "rew_std": 479.2661, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 5042.6996, "rew_std": 351.0465, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 5218.0571, "rew_std": 461.361, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 5099.4767, "rew_std": 549.3635, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 4911.2805, "rew_std": 571.7617, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 5124.3423, "rew_std": 740.2355, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 5073.4381, "rew_std": 801.7295, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 5418.5278, "rew_std": 564.8367, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 5318.2615, "rew_std": 572.5533, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 5508.5316, "rew_std": 625.3701, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 5445.9508, "rew_std": 548.5905, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 5344.9399, "rew_std": 726.9044, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 5350.4917, "rew_std": 545.9578, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 5314.5685, "rew_std": 462.1794, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 5235.3065, "rew_std": 564.983, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 5405.6218, "rew_std": 922.5236, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 5467.4483, "rew_std": 426.0478, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 5590.4942, "rew_std": 711.1954, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 5483.506, "rew_std": 727.4994, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 5604.7737, "rew_std": 574.7065, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 5703.7329, "rew_std": 667.7648, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 5636.2336, "rew_std": 558.0077, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 5608.7512, "rew_std": 751.4965, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 5513.036, "rew_std": 605.4246, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 5609.2432, "rew_std": 672.4689, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 5443.2685, "rew_std": 598.4775, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 5716.6334, "rew_std": 658.9426, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 5621.2652, "rew_std": 636.1672, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 5753.6776, "rew_std": 478.559, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 5385.6886, "rew_std": 663.7376, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 5626.3676, "rew_std": 942.3911, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 5602.6663, "rew_std": 673.6156, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 5747.0218, "rew_std": 430.6334, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 5582.5437, "rew_std": 620.8898, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 5792.1012, "rew_std": 656.0013, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 5760.8131, "rew_std": 680.0352, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 5736.4579, "rew_std": 503.2371, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 5925.6824, "rew_std": 592.2829, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 5863.0106, "rew_std": 751.258, "Agent": "TRPO"}, {"env_step": 0, "rew": -265.1803, "rew_std": 26.8288, "Agent": "A2C"}, {"env_step": 30000, "rew": -151.642, "rew_std": 224.3554, "Agent": "A2C"}, {"env_step": 60000, "rew": -92.9903, "rew_std": 289.8266, "Agent": "A2C"}, {"env_step": 90000, "rew": 38.995, "rew_std": 327.5368, "Agent": "A2C"}, {"env_step": 120000, "rew": 87.1445, "rew_std": 307.6683, "Agent": "A2C"}, {"env_step": 150000, "rew": 220.5334, "rew_std": 379.6231, "Agent": "A2C"}, {"env_step": 180000, "rew": 409.0691, "rew_std": 452.5335, "Agent": "A2C"}, {"env_step": 210000, "rew": 544.2138, "rew_std": 558.6034, "Agent": "A2C"}, {"env_step": 240000, "rew": 514.9554, "rew_std": 431.3969, "Agent": "A2C"}, {"env_step": 270000, "rew": 624.0016, "rew_std": 507.8467, "Agent": "A2C"}, {"env_step": 300000, "rew": 731.1425, "rew_std": 578.3944, "Agent": "A2C"}, {"env_step": 330000, "rew": 796.0141, "rew_std": 644.6127, "Agent": "A2C"}, {"env_step": 360000, "rew": 917.1018, "rew_std": 552.9203, "Agent": "A2C"}, {"env_step": 390000, "rew": 975.4043, "rew_std": 576.3952, "Agent": "A2C"}, {"env_step": 420000, "rew": 934.7208, "rew_std": 561.8865, "Agent": "A2C"}, {"env_step": 450000, "rew": 1119.1488, "rew_std": 647.3409, "Agent": "A2C"}, {"env_step": 480000, "rew": 1154.8508, "rew_std": 658.6049, "Agent": "A2C"}, {"env_step": 510000, "rew": 1076.622, "rew_std": 557.945, "Agent": "A2C"}, {"env_step": 540000, "rew": 1346.3252, "rew_std": 714.3876, "Agent": "A2C"}, {"env_step": 570000, "rew": 1408.3093, "rew_std": 806.4266, "Agent": "A2C"}, {"env_step": 600000, "rew": 1481.7456, "rew_std": 803.4338, "Agent": "A2C"}, {"env_step": 630000, "rew": 1511.0946, "rew_std": 811.9055, "Agent": "A2C"}, {"env_step": 660000, "rew": 1552.3128, "rew_std": 882.5074, "Agent": "A2C"}, {"env_step": 690000, "rew": 1655.6848, "rew_std": 914.6282, "Agent": "A2C"}, {"env_step": 720000, "rew": 1630.8987, "rew_std": 906.7856, "Agent": "A2C"}, {"env_step": 750000, "rew": 1796.7893, "rew_std": 1091.8783, "Agent": "A2C"}, {"env_step": 780000, "rew": 1711.6462, "rew_std": 1041.518, "Agent": "A2C"}, {"env_step": 810000, "rew": 1756.5038, "rew_std": 1036.4954, "Agent": "A2C"}, {"env_step": 840000, "rew": 1764.3135, "rew_std": 1025.8311, "Agent": "A2C"}, {"env_step": 870000, "rew": 1812.3831, "rew_std": 1058.1799, "Agent": "A2C"}, {"env_step": 900000, "rew": 1829.923, "rew_std": 1068.3028, "Agent": "A2C"}, {"env_step": 930000, "rew": 1751.078, "rew_std": 958.1423, "Agent": "A2C"}, {"env_step": 960000, "rew": 1828.2283, "rew_std": 1084.8595, "Agent": "A2C"}, {"env_step": 990000, "rew": 1935.7414, "rew_std": 1159.8274, "Agent": "A2C"}, {"env_step": 1020000, "rew": 1864.5865, "rew_std": 1113.9975, "Agent": "A2C"}, {"env_step": 1050000, "rew": 1881.9668, "rew_std": 1133.5133, "Agent": "A2C"}, {"env_step": 1080000, "rew": 1937.6426, "rew_std": 1153.6651, "Agent": "A2C"}, {"env_step": 1110000, "rew": 1928.2942, "rew_std": 1109.9099, "Agent": "A2C"}, {"env_step": 1140000, "rew": 1924.8877, "rew_std": 1196.4508, "Agent": "A2C"}, {"env_step": 1170000, "rew": 1942.7908, "rew_std": 1204.9327, "Agent": "A2C"}, {"env_step": 1200000, "rew": 1969.991, "rew_std": 1165.5349, "Agent": "A2C"}, {"env_step": 1230000, "rew": 1978.3989, "rew_std": 1163.5834, "Agent": "A2C"}, {"env_step": 1260000, "rew": 1933.0249, "rew_std": 1102.7583, "Agent": "A2C"}, {"env_step": 1290000, "rew": 1939.4646, "rew_std": 1137.9136, "Agent": "A2C"}, {"env_step": 1320000, "rew": 1975.756, "rew_std": 1157.2301, "Agent": "A2C"}, {"env_step": 1350000, "rew": 2043.2366, "rew_std": 1194.5776, "Agent": "A2C"}, {"env_step": 1380000, "rew": 1959.5897, "rew_std": 1145.7464, "Agent": "A2C"}, {"env_step": 1410000, "rew": 1995.257, "rew_std": 1190.176, "Agent": "A2C"}, {"env_step": 1440000, "rew": 1928.3597, "rew_std": 1015.5797, "Agent": "A2C"}, {"env_step": 1470000, "rew": 1892.8145, "rew_std": 1082.5848, "Agent": "A2C"}, {"env_step": 1500000, "rew": 2039.3697, "rew_std": 1250.7594, "Agent": "A2C"}, {"env_step": 1530000, "rew": 2029.4864, "rew_std": 1238.908, "Agent": "A2C"}, {"env_step": 1560000, "rew": 2105.0698, "rew_std": 1217.2523, "Agent": "A2C"}, {"env_step": 1590000, "rew": 2098.116, "rew_std": 1240.7264, "Agent": "A2C"}, {"env_step": 1620000, "rew": 2124.1828, "rew_std": 1284.9803, "Agent": "A2C"}, {"env_step": 1650000, "rew": 2095.9743, "rew_std": 1179.2287, "Agent": "A2C"}, {"env_step": 1680000, "rew": 2141.3761, "rew_std": 1227.2086, "Agent": "A2C"}, {"env_step": 1710000, "rew": 2182.5117, "rew_std": 1272.711, "Agent": "A2C"}, {"env_step": 1740000, "rew": 2117.5139, "rew_std": 1190.7188, "Agent": "A2C"}, {"env_step": 1770000, "rew": 2185.9423, "rew_std": 1307.419, "Agent": "A2C"}, {"env_step": 1800000, "rew": 2220.7673, "rew_std": 1313.4839, "Agent": "A2C"}, {"env_step": 1830000, "rew": 2209.8734, "rew_std": 1277.911, "Agent": "A2C"}, {"env_step": 1860000, "rew": 2169.9106, "rew_std": 1223.3593, "Agent": "A2C"}, {"env_step": 1890000, "rew": 2218.1295, "rew_std": 1282.6223, "Agent": "A2C"}, {"env_step": 1920000, "rew": 2158.5649, "rew_std": 1214.0396, "Agent": "A2C"}, {"env_step": 1950000, "rew": 2183.6557, "rew_std": 1288.1706, "Agent": "A2C"}, {"env_step": 1980000, "rew": 2217.1837, "rew_std": 1306.43, "Agent": "A2C"}, {"env_step": 2010000, "rew": 2231.2067, "rew_std": 1337.9609, "Agent": "A2C"}, {"env_step": 2040000, "rew": 2193.3199, "rew_std": 1228.9301, "Agent": "A2C"}, {"env_step": 2070000, "rew": 2268.7662, "rew_std": 1349.0271, "Agent": "A2C"}, {"env_step": 2100000, "rew": 2264.3721, "rew_std": 1253.8081, "Agent": "A2C"}, {"env_step": 2130000, "rew": 2244.4677, "rew_std": 1302.3581, "Agent": "A2C"}, {"env_step": 2160000, "rew": 2257.2162, "rew_std": 1296.9644, "Agent": "A2C"}, {"env_step": 2190000, "rew": 2181.3572, "rew_std": 1222.576, "Agent": "A2C"}, {"env_step": 2220000, "rew": 2307.0364, "rew_std": 1349.8938, "Agent": "A2C"}, {"env_step": 2250000, "rew": 2262.5205, "rew_std": 1304.059, "Agent": "A2C"}, {"env_step": 2280000, "rew": 2281.8044, "rew_std": 1255.3387, "Agent": "A2C"}, {"env_step": 2310000, "rew": 2298.6342, "rew_std": 1309.8012, "Agent": "A2C"}, {"env_step": 2340000, "rew": 2341.7024, "rew_std": 1321.0374, "Agent": "A2C"}, {"env_step": 2370000, "rew": 2246.4439, "rew_std": 1258.2221, "Agent": "A2C"}, {"env_step": 2400000, "rew": 2229.6385, "rew_std": 1226.8818, "Agent": "A2C"}, {"env_step": 2430000, "rew": 2222.9333, "rew_std": 1238.6857, "Agent": "A2C"}, {"env_step": 2460000, "rew": 2271.9239, "rew_std": 1225.146, "Agent": "A2C"}, {"env_step": 2490000, "rew": 2333.9164, "rew_std": 1287.422, "Agent": "A2C"}, {"env_step": 2520000, "rew": 2212.4533, "rew_std": 1203.0745, "Agent": "A2C"}, {"env_step": 2550000, "rew": 2345.4101, "rew_std": 1304.2363, "Agent": "A2C"}, {"env_step": 2580000, "rew": 2324.3592, "rew_std": 1278.9764, "Agent": "A2C"}, {"env_step": 2610000, "rew": 2329.7909, "rew_std": 1344.4421, "Agent": "A2C"}, {"env_step": 2640000, "rew": 2377.3057, "rew_std": 1363.7383, "Agent": "A2C"}, {"env_step": 2670000, "rew": 2315.1766, "rew_std": 1384.7018, "Agent": "A2C"}, {"env_step": 2700000, "rew": 2343.1761, "rew_std": 1318.4924, "Agent": "A2C"}, {"env_step": 2730000, "rew": 2289.6847, "rew_std": 1298.1297, "Agent": "A2C"}, {"env_step": 2760000, "rew": 2340.3924, "rew_std": 1353.7832, "Agent": "A2C"}, {"env_step": 2790000, "rew": 2301.7639, "rew_std": 1313.5865, "Agent": "A2C"}, {"env_step": 2820000, "rew": 2255.2329, "rew_std": 1275.3453, "Agent": "A2C"}, {"env_step": 2850000, "rew": 2367.6211, "rew_std": 1385.5564, "Agent": "A2C"}, {"env_step": 2880000, "rew": 2270.8572, "rew_std": 1289.8252, "Agent": "A2C"}, {"env_step": 2910000, "rew": 2311.5837, "rew_std": 1262.1833, "Agent": "A2C"}, {"env_step": 2940000, "rew": 2227.0238, "rew_std": 1234.4241, "Agent": "A2C"}, {"env_step": 2970000, "rew": 2285.462, "rew_std": 1210.3531, "Agent": "A2C"}, {"env_step": 3000000, "rew": 2360.4776, "rew_std": 1376.9442, "Agent": "A2C"}, {"env_step": 0, "rew": -268.1684, "rew_std": 22.1247, "Agent": "ACKTR"}, {"env_step": 30000, "rew": -14.5193, "rew_std": 138.544, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 193.7705, "rew_std": 191.3771, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 395.6773, "rew_std": 207.9727, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 578.6845, "rew_std": 321.9886, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 730.4549, "rew_std": 403.146, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 833.2477, "rew_std": 559.5678, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 940.124, "rew_std": 629.521, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 952.3074, "rew_std": 511.6155, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 1063.3239, "rew_std": 699.0664, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 1187.7045, "rew_std": 740.2877, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 1249.8625, "rew_std": 789.3878, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 1295.4229, "rew_std": 764.7084, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 1368.1586, "rew_std": 930.5967, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 1395.8387, "rew_std": 964.0231, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 1323.2105, "rew_std": 739.2303, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 1485.8828, "rew_std": 935.5817, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 1501.2576, "rew_std": 974.8261, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 1556.7868, "rew_std": 947.9883, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 1643.0914, "rew_std": 1096.2904, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 1660.5686, "rew_std": 995.5335, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 1628.4914, "rew_std": 705.7248, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 1653.1471, "rew_std": 911.5086, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 1604.3215, "rew_std": 592.5337, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 1715.827, "rew_std": 702.3705, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 1785.9494, "rew_std": 954.4084, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 1710.2602, "rew_std": 755.3784, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 1701.2389, "rew_std": 707.746, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 1687.7479, "rew_std": 626.1382, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 1523.0408, "rew_std": 458.2535, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 1801.4055, "rew_std": 760.0242, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 1876.2619, "rew_std": 950.2658, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 1768.8184, "rew_std": 781.6244, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 1783.4827, "rew_std": 850.5749, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 1788.2526, "rew_std": 770.2574, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 1780.1307, "rew_std": 863.1314, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 1887.8607, "rew_std": 810.6047, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 1859.9687, "rew_std": 944.364, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 1885.4072, "rew_std": 803.8013, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 1865.0065, "rew_std": 934.3834, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 1816.6636, "rew_std": 530.9794, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 1859.788, "rew_std": 734.1784, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 1891.369, "rew_std": 768.2084, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 1828.3124, "rew_std": 677.8935, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 1824.8614, "rew_std": 672.4608, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 1859.8675, "rew_std": 703.1076, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 1965.0207, "rew_std": 725.3783, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 1935.3317, "rew_std": 686.6766, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 1977.2533, "rew_std": 844.6317, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 1996.6427, "rew_std": 731.361, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 1909.8049, "rew_std": 648.6458, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 2083.2117, "rew_std": 964.2025, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 2078.3141, "rew_std": 927.8724, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 2172.2574, "rew_std": 1279.1033, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 2098.7222, "rew_std": 922.5966, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 2138.8731, "rew_std": 992.9591, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 2048.3473, "rew_std": 804.1683, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 2138.4514, "rew_std": 1038.8278, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 2042.7256, "rew_std": 799.9514, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 2091.9107, "rew_std": 924.8025, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 2147.6626, "rew_std": 1017.3082, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 2119.5882, "rew_std": 925.3075, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 1961.7058, "rew_std": 699.3049, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 2061.6277, "rew_std": 749.1866, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 2282.5652, "rew_std": 1102.6251, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 2227.3933, "rew_std": 1068.5204, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 2292.5157, "rew_std": 1132.1101, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 2303.1018, "rew_std": 1147.1583, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 2290.2303, "rew_std": 1070.7875, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 2360.144, "rew_std": 1252.4242, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 2366.3926, "rew_std": 1130.6992, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 2242.8126, "rew_std": 1080.0157, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 2336.7545, "rew_std": 1156.5183, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 2315.4955, "rew_std": 1044.6986, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 2330.0476, "rew_std": 1130.58, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 2352.413, "rew_std": 1096.7473, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 2389.5, "rew_std": 1160.3324, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 2324.3074, "rew_std": 1001.0831, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 2286.4306, "rew_std": 962.9473, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 2311.3439, "rew_std": 1050.2019, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 2461.8528, "rew_std": 1289.1003, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 2370.452, "rew_std": 1103.9687, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 2436.4813, "rew_std": 1226.6672, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 2407.2287, "rew_std": 1114.3394, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 2455.9365, "rew_std": 1183.1678, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 2330.6359, "rew_std": 1043.2411, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 2506.3795, "rew_std": 1410.5156, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 2409.6729, "rew_std": 1153.5073, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 2520.0984, "rew_std": 1368.7371, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 2364.8727, "rew_std": 1065.739, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 2467.9384, "rew_std": 1217.5099, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 2439.0683, "rew_std": 1165.0312, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 2392.407, "rew_std": 1111.4616, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 2448.1418, "rew_std": 1293.95, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 2413.2139, "rew_std": 1081.5176, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 2268.733, "rew_std": 915.9169, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 2381.0669, "rew_std": 1093.55, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 2417.5628, "rew_std": 1121.1654, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 2363.6494, "rew_std": 1134.7054, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 2322.6152, "rew_std": 1033.3899, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 2478.7952, "rew_std": 1188.5866, "Agent": "ACKTR"}, {"env_step": 0, "rew": -2.027, "rew_std": 0.7352, "Agent": "DDPG"}, {"env_step": 5000, "rew": -28.8271, "rew_std": 334.3419, "Agent": "DDPG"}, {"env_step": 10000, "rew": 1412.5232, "rew_std": 641.5603, "Agent": "DDPG"}, {"env_step": 15000, "rew": 1981.823, "rew_std": 561.1781, "Agent": "DDPG"}, {"env_step": 20000, "rew": 2379.8574, "rew_std": 785.2131, "Agent": "DDPG"}, {"env_step": 25000, "rew": 3125.7271, "rew_std": 479.5881, "Agent": "DDPG"}, {"env_step": 30000, "rew": 3456.9745, "rew_std": 433.4561, "Agent": "DDPG"}, {"env_step": 35000, "rew": 3823.9994, "rew_std": 779.0331, "Agent": "DDPG"}, {"env_step": 40000, "rew": 3978.0427, "rew_std": 719.3501, "Agent": "DDPG"}, {"env_step": 45000, "rew": 4546.8822, "rew_std": 620.1597, "Agent": "DDPG"}, {"env_step": 50000, "rew": 4523.1437, "rew_std": 791.7028, "Agent": "DDPG"}, {"env_step": 55000, "rew": 4710.7945, "rew_std": 912.7164, "Agent": "DDPG"}, {"env_step": 60000, "rew": 4860.8532, "rew_std": 981.0827, "Agent": "DDPG"}, {"env_step": 65000, "rew": 4937.9971, "rew_std": 1051.3911, "Agent": "DDPG"}, {"env_step": 70000, "rew": 4991.6168, "rew_std": 883.5144, "Agent": "DDPG"}, {"env_step": 75000, "rew": 5598.5992, "rew_std": 676.2098, "Agent": "DDPG"}, {"env_step": 80000, "rew": 5188.1598, "rew_std": 1077.1823, "Agent": "DDPG"}, {"env_step": 85000, "rew": 5752.0384, "rew_std": 932.4943, "Agent": "DDPG"}, {"env_step": 90000, "rew": 5805.2834, "rew_std": 1228.4622, "Agent": "DDPG"}, {"env_step": 95000, "rew": 6139.6541, "rew_std": 812.3183, "Agent": "DDPG"}, {"env_step": 100000, "rew": 6308.281, "rew_std": 1011.4719, "Agent": "DDPG"}, {"env_step": 105000, "rew": 6578.4465, "rew_std": 902.1652, "Agent": "DDPG"}, {"env_step": 110000, "rew": 6225.5968, "rew_std": 628.945, "Agent": "DDPG"}, {"env_step": 115000, "rew": 6618.0579, "rew_std": 792.9479, "Agent": "DDPG"}, {"env_step": 120000, "rew": 6636.5746, "rew_std": 758.4807, "Agent": "DDPG"}, {"env_step": 125000, "rew": 6726.8723, "rew_std": 746.8756, "Agent": "DDPG"}, {"env_step": 130000, "rew": 6426.0841, "rew_std": 1312.1471, "Agent": "DDPG"}, {"env_step": 135000, "rew": 5961.9648, "rew_std": 2287.1167, "Agent": "DDPG"}, {"env_step": 140000, "rew": 6294.7688, "rew_std": 1638.965, "Agent": "DDPG"}, {"env_step": 145000, "rew": 6992.672, "rew_std": 834.1884, "Agent": "DDPG"}, {"env_step": 150000, "rew": 6974.0589, "rew_std": 802.4812, "Agent": "DDPG"}, {"env_step": 155000, "rew": 7314.7522, "rew_std": 848.3754, "Agent": "DDPG"}, {"env_step": 160000, "rew": 7296.0335, "rew_std": 999.8537, "Agent": "DDPG"}, {"env_step": 165000, "rew": 7394.7493, "rew_std": 758.0624, "Agent": "DDPG"}, {"env_step": 170000, "rew": 7444.2435, "rew_std": 896.1343, "Agent": "DDPG"}, {"env_step": 175000, "rew": 7506.2172, "rew_std": 939.2738, "Agent": "DDPG"}, {"env_step": 180000, "rew": 7792.2261, "rew_std": 922.8894, "Agent": "DDPG"}, {"env_step": 185000, "rew": 7772.0288, "rew_std": 780.9202, "Agent": "DDPG"}, {"env_step": 190000, "rew": 7947.7237, "rew_std": 855.0877, "Agent": "DDPG"}, {"env_step": 195000, "rew": 7787.8832, "rew_std": 799.944, "Agent": "DDPG"}, {"env_step": 200000, "rew": 7913.7071, "rew_std": 1074.6718, "Agent": "DDPG"}, {"env_step": 205000, "rew": 7950.1875, "rew_std": 1026.8272, "Agent": "DDPG"}, {"env_step": 210000, "rew": 7572.8741, "rew_std": 1350.0385, "Agent": "DDPG"}, {"env_step": 215000, "rew": 7531.8723, "rew_std": 2504.3457, "Agent": "DDPG"}, {"env_step": 220000, "rew": 8093.4657, "rew_std": 1265.1079, "Agent": "DDPG"}, {"env_step": 225000, "rew": 8232.0487, "rew_std": 938.8681, "Agent": "DDPG"}, {"env_step": 230000, "rew": 8453.1188, "rew_std": 672.4392, "Agent": "DDPG"}, {"env_step": 235000, "rew": 8562.3664, "rew_std": 1045.5171, "Agent": "DDPG"}, {"env_step": 240000, "rew": 8503.9181, "rew_std": 803.2379, "Agent": "DDPG"}, {"env_step": 245000, "rew": 7906.8492, "rew_std": 2653.9952, "Agent": "DDPG"}, {"env_step": 250000, "rew": 7774.7352, "rew_std": 2889.966, "Agent": "DDPG"}, {"env_step": 255000, "rew": 7570.7543, "rew_std": 2772.8448, "Agent": "DDPG"}, {"env_step": 260000, "rew": 8732.4448, "rew_std": 760.7779, "Agent": "DDPG"}, {"env_step": 265000, "rew": 8753.7309, "rew_std": 656.8576, "Agent": "DDPG"}, {"env_step": 270000, "rew": 8893.9039, "rew_std": 633.8578, "Agent": "DDPG"}, {"env_step": 275000, "rew": 9089.5602, "rew_std": 764.8756, "Agent": "DDPG"}, {"env_step": 280000, "rew": 8964.6522, "rew_std": 642.0339, "Agent": "DDPG"}, {"env_step": 285000, "rew": 8901.8237, "rew_std": 528.058, "Agent": "DDPG"}, {"env_step": 290000, "rew": 8804.5557, "rew_std": 626.7264, "Agent": "DDPG"}, {"env_step": 295000, "rew": 9015.7802, "rew_std": 676.9585, "Agent": "DDPG"}, {"env_step": 300000, "rew": 9137.0428, "rew_std": 784.2173, "Agent": "DDPG"}, {"env_step": 305000, "rew": 9330.9567, "rew_std": 671.3886, "Agent": "DDPG"}, {"env_step": 310000, "rew": 9409.5571, "rew_std": 721.7062, "Agent": "DDPG"}, {"env_step": 315000, "rew": 9341.3278, "rew_std": 651.8969, "Agent": "DDPG"}, {"env_step": 320000, "rew": 9425.0942, "rew_std": 645.917, "Agent": "DDPG"}, {"env_step": 325000, "rew": 9431.0494, "rew_std": 869.0498, "Agent": "DDPG"}, {"env_step": 330000, "rew": 9086.6945, "rew_std": 688.3953, "Agent": "DDPG"}, {"env_step": 335000, "rew": 9417.2718, "rew_std": 746.1302, "Agent": "DDPG"}, {"env_step": 340000, "rew": 9602.646, "rew_std": 701.0568, "Agent": "DDPG"}, {"env_step": 345000, "rew": 9777.0993, "rew_std": 747.7249, "Agent": "DDPG"}, {"env_step": 350000, "rew": 9554.0485, "rew_std": 722.7574, "Agent": "DDPG"}, {"env_step": 355000, "rew": 9594.6082, "rew_std": 755.1396, "Agent": "DDPG"}, {"env_step": 360000, "rew": 9544.3629, "rew_std": 688.7421, "Agent": "DDPG"}, {"env_step": 365000, "rew": 9405.8409, "rew_std": 582.176, "Agent": "DDPG"}, {"env_step": 370000, "rew": 9343.8184, "rew_std": 670.104, "Agent": "DDPG"}, {"env_step": 375000, "rew": 9658.2741, "rew_std": 533.29, "Agent": "DDPG"}, {"env_step": 380000, "rew": 9728.9095, "rew_std": 538.4292, "Agent": "DDPG"}, {"env_step": 385000, "rew": 9820.3723, "rew_std": 629.1376, "Agent": "DDPG"}, {"env_step": 390000, "rew": 9865.2476, "rew_std": 547.6719, "Agent": "DDPG"}, {"env_step": 395000, "rew": 10002.046, "rew_std": 736.7768, "Agent": "DDPG"}, {"env_step": 400000, "rew": 9945.8354, "rew_std": 547.7547, "Agent": "DDPG"}, {"env_step": 405000, "rew": 9959.5984, "rew_std": 546.7624, "Agent": "DDPG"}, {"env_step": 410000, "rew": 10083.6288, "rew_std": 541.2135, "Agent": "DDPG"}, {"env_step": 415000, "rew": 9978.6106, "rew_std": 680.8054, "Agent": "DDPG"}, {"env_step": 420000, "rew": 10000.9096, "rew_std": 786.5215, "Agent": "DDPG"}, {"env_step": 425000, "rew": 10019.7757, "rew_std": 435.3879, "Agent": "DDPG"}, {"env_step": 430000, "rew": 9872.1755, "rew_std": 779.0172, "Agent": "DDPG"}, {"env_step": 435000, "rew": 10025.4855, "rew_std": 482.0434, "Agent": "DDPG"}, {"env_step": 440000, "rew": 10240.6122, "rew_std": 656.8871, "Agent": "DDPG"}, {"env_step": 445000, "rew": 10257.9228, "rew_std": 762.7639, "Agent": "DDPG"}, {"env_step": 450000, "rew": 10107.0443, "rew_std": 554.7625, "Agent": "DDPG"}, {"env_step": 455000, "rew": 10270.8498, "rew_std": 524.4578, "Agent": "DDPG"}, {"env_step": 460000, "rew": 10353.1613, "rew_std": 583.0093, "Agent": "DDPG"}, {"env_step": 465000, "rew": 10209.6424, "rew_std": 594.339, "Agent": "DDPG"}, {"env_step": 470000, "rew": 10087.5832, "rew_std": 663.6491, "Agent": "DDPG"}, {"env_step": 475000, "rew": 10517.1995, "rew_std": 632.7956, "Agent": "DDPG"}, {"env_step": 480000, "rew": 10349.4821, "rew_std": 536.1071, "Agent": "DDPG"}, {"env_step": 485000, "rew": 10127.5573, "rew_std": 691.1824, "Agent": "DDPG"}, {"env_step": 490000, "rew": 10253.503, "rew_std": 848.9819, "Agent": "DDPG"}, {"env_step": 495000, "rew": 10441.2324, "rew_std": 711.643, "Agent": "DDPG"}, {"env_step": 500000, "rew": 10440.0106, "rew_std": 593.0907, "Agent": "DDPG"}, {"env_step": 505000, "rew": 10530.2291, "rew_std": 587.6, "Agent": "DDPG"}, {"env_step": 510000, "rew": 10117.4034, "rew_std": 800.7787, "Agent": "DDPG"}, {"env_step": 515000, "rew": 10467.5302, "rew_std": 791.5499, "Agent": "DDPG"}, {"env_step": 520000, "rew": 10716.2178, "rew_std": 604.1685, "Agent": "DDPG"}, {"env_step": 525000, "rew": 10378.1373, "rew_std": 634.8955, "Agent": "DDPG"}, {"env_step": 530000, "rew": 10637.9629, "rew_std": 679.0302, "Agent": "DDPG"}, {"env_step": 535000, "rew": 10373.6315, "rew_std": 510.653, "Agent": "DDPG"}, {"env_step": 540000, "rew": 10604.1965, "rew_std": 628.5797, "Agent": "DDPG"}, {"env_step": 545000, "rew": 10653.719, "rew_std": 416.4147, "Agent": "DDPG"}, {"env_step": 550000, "rew": 10511.583, "rew_std": 587.2064, "Agent": "DDPG"}, {"env_step": 555000, "rew": 10560.0644, "rew_std": 646.5575, "Agent": "DDPG"}, {"env_step": 560000, "rew": 10754.83, "rew_std": 588.194, "Agent": "DDPG"}, {"env_step": 565000, "rew": 10668.4106, "rew_std": 539.8896, "Agent": "DDPG"}, {"env_step": 570000, "rew": 10749.6936, "rew_std": 447.1471, "Agent": "DDPG"}, {"env_step": 575000, "rew": 10918.2499, "rew_std": 640.5309, "Agent": "DDPG"}, {"env_step": 580000, "rew": 10610.7114, "rew_std": 643.848, "Agent": "DDPG"}, {"env_step": 585000, "rew": 10678.5014, "rew_std": 419.7959, "Agent": "DDPG"}, {"env_step": 590000, "rew": 10629.0255, "rew_std": 566.6714, "Agent": "DDPG"}, {"env_step": 595000, "rew": 10886.1181, "rew_std": 636.4089, "Agent": "DDPG"}, {"env_step": 600000, "rew": 10742.807, "rew_std": 927.385, "Agent": "DDPG"}, {"env_step": 605000, "rew": 10945.2297, "rew_std": 613.0327, "Agent": "DDPG"}, {"env_step": 610000, "rew": 10709.0516, "rew_std": 721.4677, "Agent": "DDPG"}, {"env_step": 615000, "rew": 11037.4454, "rew_std": 506.5949, "Agent": "DDPG"}, {"env_step": 620000, "rew": 11016.5806, "rew_std": 569.935, "Agent": "DDPG"}, {"env_step": 625000, "rew": 10885.3285, "rew_std": 659.2231, "Agent": "DDPG"}, {"env_step": 630000, "rew": 10900.9946, "rew_std": 707.7155, "Agent": "DDPG"}, {"env_step": 635000, "rew": 10942.9195, "rew_std": 636.7993, "Agent": "DDPG"}, {"env_step": 640000, "rew": 10882.5497, "rew_std": 841.9896, "Agent": "DDPG"}, {"env_step": 645000, "rew": 11028.7324, "rew_std": 506.2372, "Agent": "DDPG"}, {"env_step": 650000, "rew": 11011.8379, "rew_std": 618.0482, "Agent": "DDPG"}, {"env_step": 655000, "rew": 11139.0448, "rew_std": 467.1458, "Agent": "DDPG"}, {"env_step": 660000, "rew": 10950.6443, "rew_std": 616.6183, "Agent": "DDPG"}, {"env_step": 665000, "rew": 11023.1547, "rew_std": 665.6591, "Agent": "DDPG"}, {"env_step": 670000, "rew": 11194.2498, "rew_std": 574.0943, "Agent": "DDPG"}, {"env_step": 675000, "rew": 11059.1481, "rew_std": 584.0984, "Agent": "DDPG"}, {"env_step": 680000, "rew": 11154.7111, "rew_std": 658.793, "Agent": "DDPG"}, {"env_step": 685000, "rew": 11019.586, "rew_std": 645.6744, "Agent": "DDPG"}, {"env_step": 690000, "rew": 11172.7984, "rew_std": 594.8887, "Agent": "DDPG"}, {"env_step": 695000, "rew": 11071.6482, "rew_std": 451.4383, "Agent": "DDPG"}, {"env_step": 700000, "rew": 11236.911, "rew_std": 467.8947, "Agent": "DDPG"}, {"env_step": 705000, "rew": 11105.3196, "rew_std": 567.6877, "Agent": "DDPG"}, {"env_step": 710000, "rew": 11044.5712, "rew_std": 582.38, "Agent": "DDPG"}, {"env_step": 715000, "rew": 11403.593, "rew_std": 594.2401, "Agent": "DDPG"}, {"env_step": 720000, "rew": 11207.3252, "rew_std": 552.8052, "Agent": "DDPG"}, {"env_step": 725000, "rew": 11142.915, "rew_std": 569.0722, "Agent": "DDPG"}, {"env_step": 730000, "rew": 11156.9241, "rew_std": 510.7954, "Agent": "DDPG"}, {"env_step": 735000, "rew": 11116.1692, "rew_std": 432.8838, "Agent": "DDPG"}, {"env_step": 740000, "rew": 11067.6984, "rew_std": 767.6581, "Agent": "DDPG"}, {"env_step": 745000, "rew": 11300.9546, "rew_std": 607.1508, "Agent": "DDPG"}, {"env_step": 750000, "rew": 11083.3306, "rew_std": 603.7046, "Agent": "DDPG"}, {"env_step": 755000, "rew": 11192.8106, "rew_std": 493.0479, "Agent": "DDPG"}, {"env_step": 760000, "rew": 11286.6854, "rew_std": 522.0469, "Agent": "DDPG"}, {"env_step": 765000, "rew": 11233.9554, "rew_std": 463.6113, "Agent": "DDPG"}, {"env_step": 770000, "rew": 11439.1584, "rew_std": 585.3903, "Agent": "DDPG"}, {"env_step": 775000, "rew": 11361.0733, "rew_std": 546.9008, "Agent": "DDPG"}, {"env_step": 780000, "rew": 11468.0895, "rew_std": 552.944, "Agent": "DDPG"}, {"env_step": 785000, "rew": 11191.989, "rew_std": 763.2787, "Agent": "DDPG"}, {"env_step": 790000, "rew": 11370.4669, "rew_std": 596.5506, "Agent": "DDPG"}, {"env_step": 795000, "rew": 11218.5534, "rew_std": 525.4173, "Agent": "DDPG"}, {"env_step": 800000, "rew": 11289.6965, "rew_std": 517.6745, "Agent": "DDPG"}, {"env_step": 805000, "rew": 11147.309, "rew_std": 621.4135, "Agent": "DDPG"}, {"env_step": 810000, "rew": 11321.261, "rew_std": 395.6105, "Agent": "DDPG"}, {"env_step": 815000, "rew": 11385.979, "rew_std": 557.1665, "Agent": "DDPG"}, {"env_step": 820000, "rew": 11481.979, "rew_std": 490.3213, "Agent": "DDPG"}, {"env_step": 825000, "rew": 11310.0771, "rew_std": 391.0254, "Agent": "DDPG"}, {"env_step": 830000, "rew": 11467.7414, "rew_std": 609.875, "Agent": "DDPG"}, {"env_step": 835000, "rew": 11366.6416, "rew_std": 575.2764, "Agent": "DDPG"}, {"env_step": 840000, "rew": 11284.9116, "rew_std": 708.7849, "Agent": "DDPG"}, {"env_step": 845000, "rew": 11319.6365, "rew_std": 689.111, "Agent": "DDPG"}, {"env_step": 850000, "rew": 11282.7886, "rew_std": 396.2033, "Agent": "DDPG"}, {"env_step": 855000, "rew": 11381.5945, "rew_std": 471.7505, "Agent": "DDPG"}, {"env_step": 860000, "rew": 11411.786, "rew_std": 547.2996, "Agent": "DDPG"}, {"env_step": 865000, "rew": 11454.9553, "rew_std": 563.5031, "Agent": "DDPG"}, {"env_step": 870000, "rew": 11457.6559, "rew_std": 556.0714, "Agent": "DDPG"}, {"env_step": 875000, "rew": 11472.6449, "rew_std": 638.8048, "Agent": "DDPG"}, {"env_step": 880000, "rew": 11465.5412, "rew_std": 705.4152, "Agent": "DDPG"}, {"env_step": 885000, "rew": 11549.7596, "rew_std": 514.3814, "Agent": "DDPG"}, {"env_step": 890000, "rew": 11235.0108, "rew_std": 834.1102, "Agent": "DDPG"}, {"env_step": 895000, "rew": 11622.4758, "rew_std": 536.3827, "Agent": "DDPG"}, {"env_step": 900000, "rew": 11668.2049, "rew_std": 425.4828, "Agent": "DDPG"}, {"env_step": 905000, "rew": 11616.5358, "rew_std": 520.914, "Agent": "DDPG"}, {"env_step": 910000, "rew": 11570.1639, "rew_std": 521.4163, "Agent": "DDPG"}, {"env_step": 915000, "rew": 11541.2839, "rew_std": 554.1431, "Agent": "DDPG"}, {"env_step": 920000, "rew": 11296.8198, "rew_std": 749.0817, "Agent": "DDPG"}, {"env_step": 925000, "rew": 11646.0875, "rew_std": 521.0823, "Agent": "DDPG"}, {"env_step": 930000, "rew": 11592.4523, "rew_std": 562.7359, "Agent": "DDPG"}, {"env_step": 935000, "rew": 11427.8314, "rew_std": 530.3684, "Agent": "DDPG"}, {"env_step": 940000, "rew": 11597.167, "rew_std": 618.9079, "Agent": "DDPG"}, {"env_step": 945000, "rew": 11580.1866, "rew_std": 415.1078, "Agent": "DDPG"}, {"env_step": 950000, "rew": 11642.5185, "rew_std": 518.7493, "Agent": "DDPG"}, {"env_step": 955000, "rew": 11612.4348, "rew_std": 567.302, "Agent": "DDPG"}, {"env_step": 960000, "rew": 11654.0423, "rew_std": 636.8007, "Agent": "DDPG"}, {"env_step": 965000, "rew": 11365.9275, "rew_std": 571.5053, "Agent": "DDPG"}, {"env_step": 970000, "rew": 11294.5028, "rew_std": 518.7431, "Agent": "DDPG"}, {"env_step": 975000, "rew": 11529.7316, "rew_std": 460.8124, "Agent": "DDPG"}, {"env_step": 980000, "rew": 11718.7478, "rew_std": 465.5913, "Agent": "DDPG"}, {"env_step": 985000, "rew": 11458.796, "rew_std": 711.0699, "Agent": "DDPG"}, {"env_step": 990000, "rew": 11604.3687, "rew_std": 652.2274, "Agent": "DDPG"}, {"env_step": 995000, "rew": 11693.6323, "rew_std": 500.5428, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 11652.8908, "rew_std": 430.4893, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 11678.9465, "rew_std": 431.8784, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 11774.2687, "rew_std": 529.5313, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 11708.9961, "rew_std": 340.2499, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 11709.5112, "rew_std": 593.4881, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 11478.2603, "rew_std": 583.3108, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 11735.4503, "rew_std": 622.3741, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 11926.9122, "rew_std": 441.7554, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 11727.8934, "rew_std": 626.3022, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 11860.2139, "rew_std": 306.5245, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 11766.3819, "rew_std": 402.2232, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 11788.8851, "rew_std": 607.4994, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 12029.9967, "rew_std": 457.2206, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 11764.5045, "rew_std": 547.902, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 11685.009, "rew_std": 708.9527, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 11612.3431, "rew_std": 411.729, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 11726.5448, "rew_std": 479.7486, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 11942.8728, "rew_std": 481.9975, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 11991.8823, "rew_std": 452.0352, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 11780.3107, "rew_std": 337.2172, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 11866.922, "rew_std": 550.2163, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 11797.3379, "rew_std": 290.9405, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 11751.0919, "rew_std": 432.3337, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 11676.7626, "rew_std": 573.8274, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 11926.8204, "rew_std": 462.6329, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 11934.5671, "rew_std": 449.9755, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 11872.5645, "rew_std": 571.6153, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 11845.6371, "rew_std": 434.0573, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 11960.4539, "rew_std": 338.6846, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 12070.2261, "rew_std": 428.1063, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 11943.9107, "rew_std": 461.9049, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 11802.2626, "rew_std": 481.006, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 11843.9752, "rew_std": 752.8546, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 12029.565, "rew_std": 598.7713, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 11770.2589, "rew_std": 490.3858, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 11822.2428, "rew_std": 784.5172, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 11512.4653, "rew_std": 766.8959, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 11956.7763, "rew_std": 456.4773, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 11728.895, "rew_std": 673.0261, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 11935.8341, "rew_std": 574.4006, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 11926.2648, "rew_std": 355.5858, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 11928.9478, "rew_std": 478.6533, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 11856.7503, "rew_std": 700.5533, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 12008.802, "rew_std": 387.26, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 12019.8192, "rew_std": 289.377, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 12057.7479, "rew_std": 414.885, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 11917.911, "rew_std": 378.1731, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 12072.7728, "rew_std": 642.2292, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 11910.5075, "rew_std": 415.5465, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 12119.5313, "rew_std": 376.6005, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 11859.1451, "rew_std": 702.3344, "Agent": "DDPG"}, {"env_step": 0, "rew": -269.0138, "rew_std": 20.4789, "Agent": "NPG"}, {"env_step": 30720, "rew": -160.5127, "rew_std": 18.9782, "Agent": "NPG"}, {"env_step": 61440, "rew": -94.2784, "rew_std": 24.5576, "Agent": "NPG"}, {"env_step": 92160, "rew": -23.7564, "rew_std": 37.4827, "Agent": "NPG"}, {"env_step": 122880, "rew": 60.5486, "rew_std": 45.9191, "Agent": "NPG"}, {"env_step": 153600, "rew": 152.773, "rew_std": 51.9568, "Agent": "NPG"}, {"env_step": 184320, "rew": 255.3932, "rew_std": 44.2658, "Agent": "NPG"}, {"env_step": 215040, "rew": 385.9975, "rew_std": 58.6801, "Agent": "NPG"}, {"env_step": 245760, "rew": 512.9514, "rew_std": 73.3064, "Agent": "NPG"}, {"env_step": 276480, "rew": 715.265, "rew_std": 140.5167, "Agent": "NPG"}, {"env_step": 307200, "rew": 911.1576, "rew_std": 178.3159, "Agent": "NPG"}, {"env_step": 337920, "rew": 1018.4086, "rew_std": 329.9283, "Agent": "NPG"}, {"env_step": 368640, "rew": 1235.0224, "rew_std": 341.5778, "Agent": "NPG"}, {"env_step": 399360, "rew": 1443.9733, "rew_std": 468.6704, "Agent": "NPG"}, {"env_step": 430080, "rew": 1667.7531, "rew_std": 442.2423, "Agent": "NPG"}, {"env_step": 460800, "rew": 1831.5479, "rew_std": 545.5386, "Agent": "NPG"}, {"env_step": 491520, "rew": 1934.0746, "rew_std": 626.3789, "Agent": "NPG"}, {"env_step": 522240, "rew": 2237.3684, "rew_std": 593.4551, "Agent": "NPG"}, {"env_step": 552960, "rew": 2281.3317, "rew_std": 529.5114, "Agent": "NPG"}, {"env_step": 583680, "rew": 2427.3805, "rew_std": 693.1959, "Agent": "NPG"}, {"env_step": 614400, "rew": 2619.6263, "rew_std": 694.447, "Agent": "NPG"}, {"env_step": 645120, "rew": 2666.1783, "rew_std": 749.1838, "Agent": "NPG"}, {"env_step": 675840, "rew": 2752.3068, "rew_std": 775.6274, "Agent": "NPG"}, {"env_step": 706560, "rew": 2874.7079, "rew_std": 765.8785, "Agent": "NPG"}, {"env_step": 737280, "rew": 2872.5102, "rew_std": 748.8915, "Agent": "NPG"}, {"env_step": 768000, "rew": 3056.0453, "rew_std": 738.495, "Agent": "NPG"}, {"env_step": 798720, "rew": 3134.671, "rew_std": 743.2283, "Agent": "NPG"}, {"env_step": 829440, "rew": 3142.2193, "rew_std": 674.6281, "Agent": "NPG"}, {"env_step": 860160, "rew": 3243.519, "rew_std": 696.3507, "Agent": "NPG"}, {"env_step": 890880, "rew": 3307.7985, "rew_std": 717.1152, "Agent": "NPG"}, {"env_step": 921600, "rew": 3401.0174, "rew_std": 676.2871, "Agent": "NPG"}, {"env_step": 952320, "rew": 3315.1973, "rew_std": 678.3955, "Agent": "NPG"}, {"env_step": 983040, "rew": 3475.9233, "rew_std": 634.5106, "Agent": "NPG"}, {"env_step": 1013760, "rew": 3492.6633, "rew_std": 783.2726, "Agent": "NPG"}, {"env_step": 1044480, "rew": 3573.5354, "rew_std": 708.0869, "Agent": "NPG"}, {"env_step": 1075200, "rew": 3493.0792, "rew_std": 815.7911, "Agent": "NPG"}, {"env_step": 1105920, "rew": 3717.4237, "rew_std": 633.3164, "Agent": "NPG"}, {"env_step": 1136640, "rew": 3534.8559, "rew_std": 663.244, "Agent": "NPG"}, {"env_step": 1167360, "rew": 3769.5235, "rew_std": 601.7829, "Agent": "NPG"}, {"env_step": 1198080, "rew": 3819.8011, "rew_std": 606.2243, "Agent": "NPG"}, {"env_step": 1228800, "rew": 3723.3166, "rew_std": 587.2669, "Agent": "NPG"}, {"env_step": 1259520, "rew": 3885.6694, "rew_std": 546.0698, "Agent": "NPG"}, {"env_step": 1290240, "rew": 4003.4706, "rew_std": 585.2037, "Agent": "NPG"}, {"env_step": 1320960, "rew": 3967.675, "rew_std": 571.6276, "Agent": "NPG"}, {"env_step": 1351680, "rew": 3887.6813, "rew_std": 553.2184, "Agent": "NPG"}, {"env_step": 1382400, "rew": 3977.8229, "rew_std": 583.3682, "Agent": "NPG"}, {"env_step": 1413120, "rew": 4046.488, "rew_std": 555.6311, "Agent": "NPG"}, {"env_step": 1443840, "rew": 4133.6654, "rew_std": 539.3119, "Agent": "NPG"}, {"env_step": 1474560, "rew": 4109.0703, "rew_std": 531.0234, "Agent": "NPG"}, {"env_step": 1505280, "rew": 4101.6238, "rew_std": 580.5682, "Agent": "NPG"}, {"env_step": 1536000, "rew": 3914.0319, "rew_std": 640.2358, "Agent": "NPG"}, {"env_step": 1566720, "rew": 4147.142, "rew_std": 521.3236, "Agent": "NPG"}, {"env_step": 1597440, "rew": 3997.6052, "rew_std": 402.0909, "Agent": "NPG"}, {"env_step": 1628160, "rew": 4118.4834, "rew_std": 456.8417, "Agent": "NPG"}, {"env_step": 1658880, "rew": 4128.8423, "rew_std": 512.5041, "Agent": "NPG"}, {"env_step": 1689600, "rew": 4154.8767, "rew_std": 492.5337, "Agent": "NPG"}, {"env_step": 1720320, "rew": 4245.4902, "rew_std": 553.1697, "Agent": "NPG"}, {"env_step": 1751040, "rew": 4453.0335, "rew_std": 521.9303, "Agent": "NPG"}, {"env_step": 1781760, "rew": 4278.3811, "rew_std": 568.3031, "Agent": "NPG"}, {"env_step": 1812480, "rew": 4364.6593, "rew_std": 404.1046, "Agent": "NPG"}, {"env_step": 1843200, "rew": 4236.0875, "rew_std": 444.7574, "Agent": "NPG"}, {"env_step": 1873920, "rew": 4419.8157, "rew_std": 379.6884, "Agent": "NPG"}, {"env_step": 1904640, "rew": 4417.7341, "rew_std": 540.1818, "Agent": "NPG"}, {"env_step": 1935360, "rew": 4481.7258, "rew_std": 422.5195, "Agent": "NPG"}, {"env_step": 1966080, "rew": 4297.6024, "rew_std": 493.0859, "Agent": "NPG"}, {"env_step": 1996800, "rew": 4558.7537, "rew_std": 522.5865, "Agent": "NPG"}, {"env_step": 2027520, "rew": 4713.4929, "rew_std": 496.563, "Agent": "NPG"}, {"env_step": 2058240, "rew": 4553.3987, "rew_std": 379.8311, "Agent": "NPG"}, {"env_step": 2088960, "rew": 4577.1719, "rew_std": 550.7598, "Agent": "NPG"}, {"env_step": 2119680, "rew": 4473.5176, "rew_std": 435.4927, "Agent": "NPG"}, {"env_step": 2150400, "rew": 4469.529, "rew_std": 364.1314, "Agent": "NPG"}, {"env_step": 2181120, "rew": 4703.259, "rew_std": 458.4855, "Agent": "NPG"}, {"env_step": 2211840, "rew": 4770.1423, "rew_std": 462.8473, "Agent": "NPG"}, {"env_step": 2242560, "rew": 4669.0878, "rew_std": 424.4639, "Agent": "NPG"}, {"env_step": 2273280, "rew": 4740.9984, "rew_std": 485.3402, "Agent": "NPG"}, {"env_step": 2304000, "rew": 4769.8851, "rew_std": 436.0283, "Agent": "NPG"}, {"env_step": 2334720, "rew": 4727.8013, "rew_std": 434.6513, "Agent": "NPG"}, {"env_step": 2365440, "rew": 4747.5171, "rew_std": 373.4963, "Agent": "NPG"}, {"env_step": 2396160, "rew": 4843.9878, "rew_std": 436.6808, "Agent": "NPG"}, {"env_step": 2426880, "rew": 4700.4783, "rew_std": 581.0517, "Agent": "NPG"}, {"env_step": 2457600, "rew": 4864.3453, "rew_std": 415.3474, "Agent": "NPG"}, {"env_step": 2488320, "rew": 4793.7081, "rew_std": 505.4735, "Agent": "NPG"}, {"env_step": 2519040, "rew": 4967.6986, "rew_std": 460.7779, "Agent": "NPG"}, {"env_step": 2549760, "rew": 4890.799, "rew_std": 554.8942, "Agent": "NPG"}, {"env_step": 2580480, "rew": 4883.3211, "rew_std": 579.113, "Agent": "NPG"}, {"env_step": 2611200, "rew": 5020.9774, "rew_std": 433.0335, "Agent": "NPG"}, {"env_step": 2641920, "rew": 5016.0219, "rew_std": 521.9597, "Agent": "NPG"}, {"env_step": 2672640, "rew": 4845.6006, "rew_std": 456.044, "Agent": "NPG"}, {"env_step": 2703360, "rew": 4953.4677, "rew_std": 326.5535, "Agent": "NPG"}, {"env_step": 2734080, "rew": 4944.539, "rew_std": 494.4399, "Agent": "NPG"}, {"env_step": 2764800, "rew": 4991.2135, "rew_std": 510.6281, "Agent": "NPG"}, {"env_step": 2795520, "rew": 5098.4004, "rew_std": 463.7462, "Agent": "NPG"}, {"env_step": 2826240, "rew": 4930.7397, "rew_std": 688.5445, "Agent": "NPG"}, {"env_step": 2856960, "rew": 5097.8203, "rew_std": 353.8135, "Agent": "NPG"}, {"env_step": 2887680, "rew": 4994.2381, "rew_std": 353.1664, "Agent": "NPG"}, {"env_step": 2918400, "rew": 5092.6367, "rew_std": 421.4692, "Agent": "NPG"}, {"env_step": 2949120, "rew": 5126.6559, "rew_std": 402.9355, "Agent": "NPG"}, {"env_step": 2979840, "rew": 5147.4423, "rew_std": 399.1398, "Agent": "NPG"}, {"env_step": 3010560, "rew": 5225.5276, "rew_std": 446.2045, "Agent": "NPG"}, {"env_step": 3041280, "rew": 5155.818, "rew_std": 493.2056, "Agent": "NPG"}, {"env_step": 3072000, "rew": 5141.6016, "rew_std": 533.5805, "Agent": "NPG"}]