[{"env_step": 0, "rew": 17.4591, "rew_std": 3.1393, "Agent": "PPO"}, {"env_step": 30720, "rew": 258.0573, "rew_std": 21.2869, "Agent": "PPO"}, {"env_step": 61440, "rew": 321.5229, "rew_std": 32.9819, "Agent": "PPO"}, {"env_step": 92160, "rew": 368.9201, "rew_std": 45.9052, "Agent": "PPO"}, {"env_step": 122880, "rew": 399.3288, "rew_std": 43.0806, "Agent": "PPO"}, {"env_step": 153600, "rew": 432.5139, "rew_std": 71.3239, "Agent": "PPO"}, {"env_step": 184320, "rew": 499.772, "rew_std": 111.9788, "Agent": "PPO"}, {"env_step": 215040, "rew": 555.8803, "rew_std": 145.4804, "Agent": "PPO"}, {"env_step": 245760, "rew": 676.9764, "rew_std": 211.6327, "Agent": "PPO"}, {"env_step": 276480, "rew": 813.3559, "rew_std": 313.94, "Agent": "PPO"}, {"env_step": 307200, "rew": 883.8523, "rew_std": 297.6962, "Agent": "PPO"}, {"env_step": 337920, "rew": 965.7387, "rew_std": 317.0964, "Agent": "PPO"}, {"env_step": 368640, "rew": 1133.3987, "rew_std": 313.3517, "Agent": "PPO"}, {"env_step": 399360, "rew": 1301.2343, "rew_std": 435.8154, "Agent": "PPO"}, {"env_step": 430080, "rew": 1508.3458, "rew_std": 468.8199, "Agent": "PPO"}, {"env_step": 460800, "rew": 2025.0004, "rew_std": 756.4872, "Agent": "PPO"}, {"env_step": 491520, "rew": 1975.8486, "rew_std": 705.2052, "Agent": "PPO"}, {"env_step": 522240, "rew": 2227.2255, "rew_std": 669.5327, "Agent": "PPO"}, {"env_step": 552960, "rew": 2409.7045, "rew_std": 716.1465, "Agent": "PPO"}, {"env_step": 583680, "rew": 2393.2191, "rew_std": 703.3068, "Agent": "PPO"}, {"env_step": 614400, "rew": 2312.3677, "rew_std": 731.6068, "Agent": "PPO"}, {"env_step": 645120, "rew": 2165.5728, "rew_std": 703.9315, "Agent": "PPO"}, {"env_step": 675840, "rew": 2199.1089, "rew_std": 663.8891, "Agent": "PPO"}, {"env_step": 706560, "rew": 2253.354, "rew_std": 723.8256, "Agent": "PPO"}, {"env_step": 737280, "rew": 2047.2415, "rew_std": 670.5035, "Agent": "PPO"}, {"env_step": 768000, "rew": 2268.8839, "rew_std": 920.2149, "Agent": "PPO"}, {"env_step": 798720, "rew": 2331.4466, "rew_std": 660.495, "Agent": "PPO"}, {"env_step": 829440, "rew": 2395.9565, "rew_std": 766.3797, "Agent": "PPO"}, {"env_step": 860160, "rew": 2412.8335, "rew_std": 845.1709, "Agent": "PPO"}, {"env_step": 890880, "rew": 2609.335, "rew_std": 700.8103, "Agent": "PPO"}, {"env_step": 921600, "rew": 2323.7125, "rew_std": 554.5084, "Agent": "PPO"}, {"env_step": 952320, "rew": 2342.3823, "rew_std": 677.2163, "Agent": "PPO"}, {"env_step": 983040, "rew": 2370.1043, "rew_std": 695.5023, "Agent": "PPO"}, {"env_step": 1013760, "rew": 2482.5501, "rew_std": 852.3902, "Agent": "PPO"}, {"env_step": 1044480, "rew": 2543.0648, "rew_std": 664.076, "Agent": "PPO"}, {"env_step": 1075200, "rew": 2595.0248, "rew_std": 682.0517, "Agent": "PPO"}, {"env_step": 1105920, "rew": 2293.5028, "rew_std": 619.1544, "Agent": "PPO"}, {"env_step": 1136640, "rew": 2665.0402, "rew_std": 689.8843, "Agent": "PPO"}, {"env_step": 1167360, "rew": 2365.2063, "rew_std": 640.2129, "Agent": "PPO"}, {"env_step": 1198080, "rew": 2740.7154, "rew_std": 743.8731, "Agent": "PPO"}, {"env_step": 1228800, "rew": 2375.3191, "rew_std": 919.2542, "Agent": "PPO"}, {"env_step": 1259520, "rew": 2752.1238, "rew_std": 635.7227, "Agent": "PPO"}, {"env_step": 1290240, "rew": 2652.1802, "rew_std": 545.9033, "Agent": "PPO"}, {"env_step": 1320960, "rew": 2563.4924, "rew_std": 543.7153, "Agent": "PPO"}, {"env_step": 1351680, "rew": 2903.989, "rew_std": 437.1591, "Agent": "PPO"}, {"env_step": 1382400, "rew": 2708.8197, "rew_std": 442.3195, "Agent": "PPO"}, {"env_step": 1413120, "rew": 2696.5147, "rew_std": 533.7476, "Agent": "PPO"}, {"env_step": 1443840, "rew": 2825.6167, "rew_std": 502.3265, "Agent": "PPO"}, {"env_step": 1474560, "rew": 2837.7101, "rew_std": 583.6296, "Agent": "PPO"}, {"env_step": 1505280, "rew": 2286.467, "rew_std": 775.9048, "Agent": "PPO"}, {"env_step": 1536000, "rew": 2564.4424, "rew_std": 609.329, "Agent": "PPO"}, {"env_step": 1566720, "rew": 2815.8548, "rew_std": 473.1315, "Agent": "PPO"}, {"env_step": 1597440, "rew": 2637.735, "rew_std": 407.1216, "Agent": "PPO"}, {"env_step": 1628160, "rew": 2826.9888, "rew_std": 466.1343, "Agent": "PPO"}, {"env_step": 1658880, "rew": 2679.819, "rew_std": 604.9165, "Agent": "PPO"}, {"env_step": 1689600, "rew": 2310.0095, "rew_std": 820.3102, "Agent": "PPO"}, {"env_step": 1720320, "rew": 2401.5418, "rew_std": 607.9464, "Agent": "PPO"}, {"env_step": 1751040, "rew": 2253.5243, "rew_std": 640.3227, "Agent": "PPO"}, {"env_step": 1781760, "rew": 2329.541, "rew_std": 569.5139, "Agent": "PPO"}, {"env_step": 1812480, "rew": 2402.1102, "rew_std": 546.2053, "Agent": "PPO"}, {"env_step": 1843200, "rew": 2731.4867, "rew_std": 377.6566, "Agent": "PPO"}, {"env_step": 1873920, "rew": 2638.8958, "rew_std": 423.2264, "Agent": "PPO"}, {"env_step": 1904640, "rew": 2741.9472, "rew_std": 490.6814, "Agent": "PPO"}, {"env_step": 1935360, "rew": 2672.56, "rew_std": 626.8115, "Agent": "PPO"}, {"env_step": 1966080, "rew": 2579.2487, "rew_std": 823.8814, "Agent": "PPO"}, {"env_step": 1996800, "rew": 2532.4619, "rew_std": 608.9239, "Agent": "PPO"}, {"env_step": 2027520, "rew": 2714.8373, "rew_std": 558.9923, "Agent": "PPO"}, {"env_step": 2058240, "rew": 2790.1972, "rew_std": 606.7406, "Agent": "PPO"}, {"env_step": 2088960, "rew": 2806.6684, "rew_std": 594.6761, "Agent": "PPO"}, {"env_step": 2119680, "rew": 2983.2358, "rew_std": 490.9231, "Agent": "PPO"}, {"env_step": 2150400, "rew": 2678.8518, "rew_std": 383.2641, "Agent": "PPO"}, {"env_step": 2181120, "rew": 2504.8482, "rew_std": 731.2124, "Agent": "PPO"}, {"env_step": 2211840, "rew": 2916.3325, "rew_std": 529.2655, "Agent": "PPO"}, {"env_step": 2242560, "rew": 2736.5338, "rew_std": 549.6671, "Agent": "PPO"}, {"env_step": 2273280, "rew": 2704.9419, "rew_std": 624.3988, "Agent": "PPO"}, {"env_step": 2304000, "rew": 2578.0559, "rew_std": 619.9542, "Agent": "PPO"}, {"env_step": 2334720, "rew": 2459.1878, "rew_std": 714.9442, "Agent": "PPO"}, {"env_step": 2365440, "rew": 2359.8527, "rew_std": 534.6146, "Agent": "PPO"}, {"env_step": 2396160, "rew": 2530.1409, "rew_std": 724.2738, "Agent": "PPO"}, {"env_step": 2426880, "rew": 2624.1701, "rew_std": 535.1847, "Agent": "PPO"}, {"env_step": 2457600, "rew": 2731.1249, "rew_std": 553.7215, "Agent": "PPO"}, {"env_step": 2488320, "rew": 2601.1055, "rew_std": 374.4485, "Agent": "PPO"}, {"env_step": 2519040, "rew": 2680.2664, "rew_std": 439.8017, "Agent": "PPO"}, {"env_step": 2549760, "rew": 2991.4033, "rew_std": 377.8164, "Agent": "PPO"}, {"env_step": 2580480, "rew": 2935.6051, "rew_std": 455.1756, "Agent": "PPO"}, {"env_step": 2611200, "rew": 3086.7075, "rew_std": 346.5505, "Agent": "PPO"}, {"env_step": 2641920, "rew": 2894.2612, "rew_std": 316.5737, "Agent": "PPO"}, {"env_step": 2672640, "rew": 3127.6851, "rew_std": 413.0159, "Agent": "PPO"}, {"env_step": 2703360, "rew": 2947.9566, "rew_std": 440.9114, "Agent": "PPO"}, {"env_step": 2734080, "rew": 3080.4229, "rew_std": 392.3963, "Agent": "PPO"}, {"env_step": 2764800, "rew": 2959.3085, "rew_std": 509.0458, "Agent": "PPO"}, {"env_step": 2795520, "rew": 2998.2617, "rew_std": 363.2342, "Agent": "PPO"}, {"env_step": 2826240, "rew": 3025.9286, "rew_std": 327.0367, "Agent": "PPO"}, {"env_step": 2856960, "rew": 2685.6607, "rew_std": 479.2221, "Agent": "PPO"}, {"env_step": 2887680, "rew": 2904.1953, "rew_std": 525.6346, "Agent": "PPO"}, {"env_step": 2918400, "rew": 2766.6171, "rew_std": 547.6156, "Agent": "PPO"}, {"env_step": 2949120, "rew": 2775.0355, "rew_std": 490.8935, "Agent": "PPO"}, {"env_step": 2979840, "rew": 2534.7584, "rew_std": 647.3288, "Agent": "PPO"}, {"env_step": 3010560, "rew": 2747.8063, "rew_std": 647.902, "Agent": "PPO"}, {"env_step": 3041280, "rew": 2786.2628, "rew_std": 657.6806, "Agent": "PPO"}, {"env_step": 3072000, "rew": 2714.6257, "rew_std": 651.8296, "Agent": "PPO"}, {"env_step": 0, "rew": 47.4556, "rew_std": 36.0937, "Agent": "TD3"}, {"env_step": 5000, "rew": 181.1706, "rew_std": 11.8607, "Agent": "TD3"}, {"env_step": 10000, "rew": 195.6339, "rew_std": 28.1807, "Agent": "TD3"}, {"env_step": 15000, "rew": 196.3426, "rew_std": 38.924, "Agent": "TD3"}, {"env_step": 20000, "rew": 245.9809, "rew_std": 64.7713, "Agent": "TD3"}, {"env_step": 25000, "rew": 226.7399, "rew_std": 45.5801, "Agent": "TD3"}, {"env_step": 30000, "rew": 244.7301, "rew_std": 37.4813, "Agent": "TD3"}, {"env_step": 35000, "rew": 230.0412, "rew_std": 31.198, "Agent": "TD3"}, {"env_step": 40000, "rew": 261.6885, "rew_std": 26.8584, "Agent": "TD3"}, {"env_step": 45000, "rew": 329.7057, "rew_std": 58.7719, "Agent": "TD3"}, {"env_step": 50000, "rew": 321.4114, "rew_std": 45.1645, "Agent": "TD3"}, {"env_step": 55000, "rew": 403.0395, "rew_std": 213.6362, "Agent": "TD3"}, {"env_step": 60000, "rew": 341.5308, "rew_std": 98.1405, "Agent": "TD3"}, {"env_step": 65000, "rew": 461.4619, "rew_std": 232.873, "Agent": "TD3"}, {"env_step": 70000, "rew": 346.6516, "rew_std": 94.5479, "Agent": "TD3"}, {"env_step": 75000, "rew": 336.0042, "rew_std": 81.4701, "Agent": "TD3"}, {"env_step": 80000, "rew": 391.4512, "rew_std": 149.1327, "Agent": "TD3"}, {"env_step": 85000, "rew": 544.4272, "rew_std": 227.6467, "Agent": "TD3"}, {"env_step": 90000, "rew": 710.7108, "rew_std": 549.5041, "Agent": "TD3"}, {"env_step": 95000, "rew": 500.0801, "rew_std": 247.3054, "Agent": "TD3"}, {"env_step": 100000, "rew": 596.5279, "rew_std": 287.8254, "Agent": "TD3"}, {"env_step": 105000, "rew": 623.8025, "rew_std": 327.5888, "Agent": "TD3"}, {"env_step": 110000, "rew": 513.4111, "rew_std": 255.0535, "Agent": "TD3"}, {"env_step": 115000, "rew": 495.5632, "rew_std": 212.4063, "Agent": "TD3"}, {"env_step": 120000, "rew": 555.7409, "rew_std": 227.1517, "Agent": "TD3"}, {"env_step": 125000, "rew": 718.938, "rew_std": 723.5998, "Agent": "TD3"}, {"env_step": 130000, "rew": 680.9442, "rew_std": 460.8098, "Agent": "TD3"}, {"env_step": 135000, "rew": 520.8898, "rew_std": 214.5221, "Agent": "TD3"}, {"env_step": 140000, "rew": 650.3446, "rew_std": 461.5131, "Agent": "TD3"}, {"env_step": 145000, "rew": 684.433, "rew_std": 475.0653, "Agent": "TD3"}, {"env_step": 150000, "rew": 696.6079, "rew_std": 409.8031, "Agent": "TD3"}, {"env_step": 155000, "rew": 927.7476, "rew_std": 772.3126, "Agent": "TD3"}, {"env_step": 160000, "rew": 625.1645, "rew_std": 477.6126, "Agent": "TD3"}, {"env_step": 165000, "rew": 794.7899, "rew_std": 506.2143, "Agent": "TD3"}, {"env_step": 170000, "rew": 1005.2103, "rew_std": 853.9211, "Agent": "TD3"}, {"env_step": 175000, "rew": 845.2076, "rew_std": 627.2596, "Agent": "TD3"}, {"env_step": 180000, "rew": 854.2243, "rew_std": 463.2582, "Agent": "TD3"}, {"env_step": 185000, "rew": 882.8193, "rew_std": 611.5015, "Agent": "TD3"}, {"env_step": 190000, "rew": 881.529, "rew_std": 520.6295, "Agent": "TD3"}, {"env_step": 195000, "rew": 936.7988, "rew_std": 578.7772, "Agent": "TD3"}, {"env_step": 200000, "rew": 887.1944, "rew_std": 649.2743, "Agent": "TD3"}, {"env_step": 205000, "rew": 1003.2064, "rew_std": 719.9525, "Agent": "TD3"}, {"env_step": 210000, "rew": 1259.7631, "rew_std": 918.6324, "Agent": "TD3"}, {"env_step": 215000, "rew": 1218.8341, "rew_std": 909.5814, "Agent": "TD3"}, {"env_step": 220000, "rew": 1454.8435, "rew_std": 961.2179, "Agent": "TD3"}, {"env_step": 225000, "rew": 1120.2673, "rew_std": 742.6399, "Agent": "TD3"}, {"env_step": 230000, "rew": 1388.694, "rew_std": 971.8594, "Agent": "TD3"}, {"env_step": 235000, "rew": 1141.3244, "rew_std": 584.5602, "Agent": "TD3"}, {"env_step": 240000, "rew": 1218.6979, "rew_std": 672.9531, "Agent": "TD3"}, {"env_step": 245000, "rew": 1227.6752, "rew_std": 779.683, "Agent": "TD3"}, {"env_step": 250000, "rew": 1426.1448, "rew_std": 883.1093, "Agent": "TD3"}, {"env_step": 255000, "rew": 1356.3186, "rew_std": 913.06, "Agent": "TD3"}, {"env_step": 260000, "rew": 1519.809, "rew_std": 974.498, "Agent": "TD3"}, {"env_step": 265000, "rew": 1430.8821, "rew_std": 1039.3051, "Agent": "TD3"}, {"env_step": 270000, "rew": 1697.1211, "rew_std": 967.8384, "Agent": "TD3"}, {"env_step": 275000, "rew": 1505.3005, "rew_std": 877.8138, "Agent": "TD3"}, {"env_step": 280000, "rew": 1616.8995, "rew_std": 1006.4543, "Agent": "TD3"}, {"env_step": 285000, "rew": 1595.6735, "rew_std": 880.8836, "Agent": "TD3"}, {"env_step": 290000, "rew": 1669.8616, "rew_std": 788.7447, "Agent": "TD3"}, {"env_step": 295000, "rew": 1680.3393, "rew_std": 771.5441, "Agent": "TD3"}, {"env_step": 300000, "rew": 1583.401, "rew_std": 639.2439, "Agent": "TD3"}, {"env_step": 305000, "rew": 1410.9341, "rew_std": 802.8923, "Agent": "TD3"}, {"env_step": 310000, "rew": 1579.7909, "rew_std": 833.9381, "Agent": "TD3"}, {"env_step": 315000, "rew": 1790.2155, "rew_std": 852.3138, "Agent": "TD3"}, {"env_step": 320000, "rew": 1725.0626, "rew_std": 1004.9677, "Agent": "TD3"}, {"env_step": 325000, "rew": 1773.9219, "rew_std": 818.0885, "Agent": "TD3"}, {"env_step": 330000, "rew": 1934.2742, "rew_std": 983.5329, "Agent": "TD3"}, {"env_step": 335000, "rew": 2059.7185, "rew_std": 992.11, "Agent": "TD3"}, {"env_step": 340000, "rew": 2165.3606, "rew_std": 801.6612, "Agent": "TD3"}, {"env_step": 345000, "rew": 2249.709, "rew_std": 867.5837, "Agent": "TD3"}, {"env_step": 350000, "rew": 2394.7054, "rew_std": 793.9618, "Agent": "TD3"}, {"env_step": 355000, "rew": 2366.3303, "rew_std": 864.5402, "Agent": "TD3"}, {"env_step": 360000, "rew": 2160.4499, "rew_std": 615.6932, "Agent": "TD3"}, {"env_step": 365000, "rew": 2308.3733, "rew_std": 745.4213, "Agent": "TD3"}, {"env_step": 370000, "rew": 1827.3007, "rew_std": 889.1223, "Agent": "TD3"}, {"env_step": 375000, "rew": 2541.1833, "rew_std": 828.5518, "Agent": "TD3"}, {"env_step": 380000, "rew": 2423.2221, "rew_std": 908.2991, "Agent": "TD3"}, {"env_step": 385000, "rew": 2213.5402, "rew_std": 885.9217, "Agent": "TD3"}, {"env_step": 390000, "rew": 2481.258, "rew_std": 730.3209, "Agent": "TD3"}, {"env_step": 395000, "rew": 2167.8909, "rew_std": 919.1415, "Agent": "TD3"}, {"env_step": 400000, "rew": 2247.8712, "rew_std": 1008.3715, "Agent": "TD3"}, {"env_step": 405000, "rew": 2381.9554, "rew_std": 942.0726, "Agent": "TD3"}, {"env_step": 410000, "rew": 2653.6324, "rew_std": 858.8246, "Agent": "TD3"}, {"env_step": 415000, "rew": 2547.441, "rew_std": 933.1938, "Agent": "TD3"}, {"env_step": 420000, "rew": 2613.1125, "rew_std": 735.4271, "Agent": "TD3"}, {"env_step": 425000, "rew": 2594.5911, "rew_std": 757.9404, "Agent": "TD3"}, {"env_step": 430000, "rew": 2264.0453, "rew_std": 1073.4573, "Agent": "TD3"}, {"env_step": 435000, "rew": 2646.8585, "rew_std": 896.8083, "Agent": "TD3"}, {"env_step": 440000, "rew": 2755.1494, "rew_std": 610.0019, "Agent": "TD3"}, {"env_step": 445000, "rew": 2805.4777, "rew_std": 803.6409, "Agent": "TD3"}, {"env_step": 450000, "rew": 2875.6351, "rew_std": 744.3018, "Agent": "TD3"}, {"env_step": 455000, "rew": 2817.7326, "rew_std": 794.6529, "Agent": "TD3"}, {"env_step": 460000, "rew": 2793.4703, "rew_std": 717.5994, "Agent": "TD3"}, {"env_step": 465000, "rew": 2842.3719, "rew_std": 765.139, "Agent": "TD3"}, {"env_step": 470000, "rew": 2563.8287, "rew_std": 712.3143, "Agent": "TD3"}, {"env_step": 475000, "rew": 2669.7186, "rew_std": 933.7879, "Agent": "TD3"}, {"env_step": 480000, "rew": 2685.2956, "rew_std": 968.0261, "Agent": "TD3"}, {"env_step": 485000, "rew": 2700.6731, "rew_std": 821.3018, "Agent": "TD3"}, {"env_step": 490000, "rew": 2964.1087, "rew_std": 448.9934, "Agent": "TD3"}, {"env_step": 495000, "rew": 2943.0135, "rew_std": 647.4103, "Agent": "TD3"}, {"env_step": 500000, "rew": 2961.4207, "rew_std": 655.0678, "Agent": "TD3"}, {"env_step": 505000, "rew": 2849.137, "rew_std": 761.0781, "Agent": "TD3"}, {"env_step": 510000, "rew": 3098.253, "rew_std": 469.053, "Agent": "TD3"}, {"env_step": 515000, "rew": 3154.2582, "rew_std": 501.1539, "Agent": "TD3"}, {"env_step": 520000, "rew": 2987.3938, "rew_std": 511.4157, "Agent": "TD3"}, {"env_step": 525000, "rew": 3201.9522, "rew_std": 309.5776, "Agent": "TD3"}, {"env_step": 530000, "rew": 3127.0868, "rew_std": 499.4894, "Agent": "TD3"}, {"env_step": 535000, "rew": 3231.7025, "rew_std": 247.2752, "Agent": "TD3"}, {"env_step": 540000, "rew": 3246.6948, "rew_std": 423.8079, "Agent": "TD3"}, {"env_step": 545000, "rew": 3244.2828, "rew_std": 285.0854, "Agent": "TD3"}, {"env_step": 550000, "rew": 3296.3845, "rew_std": 280.0152, "Agent": "TD3"}, {"env_step": 555000, "rew": 3339.8197, "rew_std": 133.4885, "Agent": "TD3"}, {"env_step": 560000, "rew": 3292.3128, "rew_std": 240.2349, "Agent": "TD3"}, {"env_step": 565000, "rew": 3351.0744, "rew_std": 136.4845, "Agent": "TD3"}, {"env_step": 570000, "rew": 3253.555, "rew_std": 283.2193, "Agent": "TD3"}, {"env_step": 575000, "rew": 3142.2054, "rew_std": 641.4588, "Agent": "TD3"}, {"env_step": 580000, "rew": 3145.471, "rew_std": 655.4939, "Agent": "TD3"}, {"env_step": 585000, "rew": 3212.4539, "rew_std": 238.0762, "Agent": "TD3"}, {"env_step": 590000, "rew": 3020.1885, "rew_std": 722.6471, "Agent": "TD3"}, {"env_step": 595000, "rew": 3354.9395, "rew_std": 97.4237, "Agent": "TD3"}, {"env_step": 600000, "rew": 3192.8687, "rew_std": 478.9294, "Agent": "TD3"}, {"env_step": 605000, "rew": 2998.3348, "rew_std": 798.7227, "Agent": "TD3"}, {"env_step": 610000, "rew": 3357.0238, "rew_std": 134.9546, "Agent": "TD3"}, {"env_step": 615000, "rew": 3366.7968, "rew_std": 103.0748, "Agent": "TD3"}, {"env_step": 620000, "rew": 3206.5507, "rew_std": 436.868, "Agent": "TD3"}, {"env_step": 625000, "rew": 3171.6245, "rew_std": 659.9982, "Agent": "TD3"}, {"env_step": 630000, "rew": 3231.2786, "rew_std": 265.3576, "Agent": "TD3"}, {"env_step": 635000, "rew": 3307.9242, "rew_std": 241.2563, "Agent": "TD3"}, {"env_step": 640000, "rew": 3016.9011, "rew_std": 926.3848, "Agent": "TD3"}, {"env_step": 645000, "rew": 3368.7732, "rew_std": 129.5799, "Agent": "TD3"}, {"env_step": 650000, "rew": 3227.2273, "rew_std": 289.7332, "Agent": "TD3"}, {"env_step": 655000, "rew": 3240.2439, "rew_std": 365.6094, "Agent": "TD3"}, {"env_step": 660000, "rew": 3227.2667, "rew_std": 285.7852, "Agent": "TD3"}, {"env_step": 665000, "rew": 3265.8132, "rew_std": 418.3806, "Agent": "TD3"}, {"env_step": 670000, "rew": 3282.3655, "rew_std": 368.4049, "Agent": "TD3"}, {"env_step": 675000, "rew": 3258.526, "rew_std": 377.9988, "Agent": "TD3"}, {"env_step": 680000, "rew": 3263.2283, "rew_std": 152.4962, "Agent": "TD3"}, {"env_step": 685000, "rew": 3089.7907, "rew_std": 295.5492, "Agent": "TD3"}, {"env_step": 690000, "rew": 3172.968, "rew_std": 315.6106, "Agent": "TD3"}, {"env_step": 695000, "rew": 3092.3138, "rew_std": 482.2803, "Agent": "TD3"}, {"env_step": 700000, "rew": 3086.4148, "rew_std": 537.6133, "Agent": "TD3"}, {"env_step": 705000, "rew": 3187.0369, "rew_std": 376.8388, "Agent": "TD3"}, {"env_step": 710000, "rew": 3257.3183, "rew_std": 384.8109, "Agent": "TD3"}, {"env_step": 715000, "rew": 3217.0255, "rew_std": 331.0033, "Agent": "TD3"}, {"env_step": 720000, "rew": 3053.4691, "rew_std": 728.2795, "Agent": "TD3"}, {"env_step": 725000, "rew": 3255.4324, "rew_std": 315.9673, "Agent": "TD3"}, {"env_step": 730000, "rew": 3048.3769, "rew_std": 760.9075, "Agent": "TD3"}, {"env_step": 735000, "rew": 3265.5531, "rew_std": 269.5899, "Agent": "TD3"}, {"env_step": 740000, "rew": 3283.9958, "rew_std": 289.6054, "Agent": "TD3"}, {"env_step": 745000, "rew": 3073.2362, "rew_std": 408.9806, "Agent": "TD3"}, {"env_step": 750000, "rew": 3045.4661, "rew_std": 593.2175, "Agent": "TD3"}, {"env_step": 755000, "rew": 3077.6696, "rew_std": 472.3235, "Agent": "TD3"}, {"env_step": 760000, "rew": 3080.2428, "rew_std": 695.1234, "Agent": "TD3"}, {"env_step": 765000, "rew": 3198.3011, "rew_std": 231.1821, "Agent": "TD3"}, {"env_step": 770000, "rew": 3342.6777, "rew_std": 303.2243, "Agent": "TD3"}, {"env_step": 775000, "rew": 3374.2952, "rew_std": 204.2809, "Agent": "TD3"}, {"env_step": 780000, "rew": 3350.8202, "rew_std": 251.5599, "Agent": "TD3"}, {"env_step": 785000, "rew": 3417.5119, "rew_std": 153.9788, "Agent": "TD3"}, {"env_step": 790000, "rew": 3062.315, "rew_std": 753.7818, "Agent": "TD3"}, {"env_step": 795000, "rew": 3443.6579, "rew_std": 140.8264, "Agent": "TD3"}, {"env_step": 800000, "rew": 3214.8637, "rew_std": 393.858, "Agent": "TD3"}, {"env_step": 805000, "rew": 3172.6333, "rew_std": 538.8215, "Agent": "TD3"}, {"env_step": 810000, "rew": 3314.041, "rew_std": 291.0874, "Agent": "TD3"}, {"env_step": 815000, "rew": 3414.3737, "rew_std": 133.3112, "Agent": "TD3"}, {"env_step": 820000, "rew": 2948.3976, "rew_std": 1085.3824, "Agent": "TD3"}, {"env_step": 825000, "rew": 3418.1071, "rew_std": 219.9899, "Agent": "TD3"}, {"env_step": 830000, "rew": 3054.1659, "rew_std": 749.0992, "Agent": "TD3"}, {"env_step": 835000, "rew": 3421.8961, "rew_std": 174.2378, "Agent": "TD3"}, {"env_step": 840000, "rew": 3402.1026, "rew_std": 254.3867, "Agent": "TD3"}, {"env_step": 845000, "rew": 3391.7669, "rew_std": 209.177, "Agent": "TD3"}, {"env_step": 850000, "rew": 3122.6524, "rew_std": 611.6579, "Agent": "TD3"}, {"env_step": 855000, "rew": 3437.683, "rew_std": 156.0111, "Agent": "TD3"}, {"env_step": 860000, "rew": 3421.7968, "rew_std": 175.8982, "Agent": "TD3"}, {"env_step": 865000, "rew": 3472.2399, "rew_std": 116.7905, "Agent": "TD3"}, {"env_step": 870000, "rew": 3181.0626, "rew_std": 532.352, "Agent": "TD3"}, {"env_step": 875000, "rew": 3355.169, "rew_std": 366.8383, "Agent": "TD3"}, {"env_step": 880000, "rew": 3276.6772, "rew_std": 365.8959, "Agent": "TD3"}, {"env_step": 885000, "rew": 3234.2254, "rew_std": 380.1403, "Agent": "TD3"}, {"env_step": 890000, "rew": 3449.26, "rew_std": 159.677, "Agent": "TD3"}, {"env_step": 895000, "rew": 3092.4727, "rew_std": 723.0347, "Agent": "TD3"}, {"env_step": 900000, "rew": 3378.2511, "rew_std": 174.6047, "Agent": "TD3"}, {"env_step": 905000, "rew": 3419.4817, "rew_std": 97.2881, "Agent": "TD3"}, {"env_step": 910000, "rew": 3385.7236, "rew_std": 231.5133, "Agent": "TD3"}, {"env_step": 915000, "rew": 3168.5126, "rew_std": 752.5883, "Agent": "TD3"}, {"env_step": 920000, "rew": 3258.2632, "rew_std": 564.3516, "Agent": "TD3"}, {"env_step": 925000, "rew": 3328.8538, "rew_std": 287.7357, "Agent": "TD3"}, {"env_step": 930000, "rew": 3416.1365, "rew_std": 199.7163, "Agent": "TD3"}, {"env_step": 935000, "rew": 3310.5707, "rew_std": 422.2578, "Agent": "TD3"}, {"env_step": 940000, "rew": 3469.4841, "rew_std": 132.6303, "Agent": "TD3"}, {"env_step": 945000, "rew": 3411.9133, "rew_std": 184.6796, "Agent": "TD3"}, {"env_step": 950000, "rew": 3445.803, "rew_std": 188.1911, "Agent": "TD3"}, {"env_step": 955000, "rew": 3433.6352, "rew_std": 199.4321, "Agent": "TD3"}, {"env_step": 960000, "rew": 3252.8105, "rew_std": 695.7155, "Agent": "TD3"}, {"env_step": 965000, "rew": 3229.0901, "rew_std": 685.0382, "Agent": "TD3"}, {"env_step": 970000, "rew": 3035.6979, "rew_std": 1069.2395, "Agent": "TD3"}, {"env_step": 975000, "rew": 3298.0468, "rew_std": 460.4312, "Agent": "TD3"}, {"env_step": 980000, "rew": 3349.4871, "rew_std": 261.0919, "Agent": "TD3"}, {"env_step": 985000, "rew": 3318.7927, "rew_std": 490.6575, "Agent": "TD3"}, {"env_step": 990000, "rew": 3055.1773, "rew_std": 695.5763, "Agent": "TD3"}, {"env_step": 995000, "rew": 3264.6276, "rew_std": 440.8577, "Agent": "TD3"}, {"env_step": 1000000, "rew": 3132.5766, "rew_std": 771.7353, "Agent": "TD3"}, {"env_step": 1005000, "rew": 3309.2497, "rew_std": 546.4882, "Agent": "TD3"}, {"env_step": 1010000, "rew": 3308.7683, "rew_std": 358.811, "Agent": "TD3"}, {"env_step": 1015000, "rew": 3300.2122, "rew_std": 407.792, "Agent": "TD3"}, {"env_step": 1020000, "rew": 3454.3862, "rew_std": 180.6148, "Agent": "TD3"}, {"env_step": 1025000, "rew": 3355.6457, "rew_std": 306.9581, "Agent": "TD3"}, {"env_step": 1030000, "rew": 3362.1583, "rew_std": 296.1113, "Agent": "TD3"}, {"env_step": 1035000, "rew": 3398.9778, "rew_std": 186.8083, "Agent": "TD3"}, {"env_step": 1040000, "rew": 3388.1484, "rew_std": 205.7846, "Agent": "TD3"}, {"env_step": 1045000, "rew": 3487.3008, "rew_std": 116.211, "Agent": "TD3"}, {"env_step": 1050000, "rew": 3451.232, "rew_std": 110.6646, "Agent": "TD3"}, {"env_step": 1055000, "rew": 3088.9652, "rew_std": 879.486, "Agent": "TD3"}, {"env_step": 1060000, "rew": 3363.9858, "rew_std": 303.7124, "Agent": "TD3"}, {"env_step": 1065000, "rew": 3415.9527, "rew_std": 241.6345, "Agent": "TD3"}, {"env_step": 1070000, "rew": 3220.853, "rew_std": 626.2711, "Agent": "TD3"}, {"env_step": 1075000, "rew": 3387.6881, "rew_std": 241.4848, "Agent": "TD3"}, {"env_step": 1080000, "rew": 3492.6301, "rew_std": 107.173, "Agent": "TD3"}, {"env_step": 1085000, "rew": 3496.5603, "rew_std": 90.9081, "Agent": "TD3"}, {"env_step": 1090000, "rew": 3497.1501, "rew_std": 100.4975, "Agent": "TD3"}, {"env_step": 1095000, "rew": 3245.6992, "rew_std": 528.5044, "Agent": "TD3"}, {"env_step": 1100000, "rew": 3214.6306, "rew_std": 509.1668, "Agent": "TD3"}, {"env_step": 1105000, "rew": 3470.5285, "rew_std": 116.7226, "Agent": "TD3"}, {"env_step": 1110000, "rew": 3495.2515, "rew_std": 158.7062, "Agent": "TD3"}, {"env_step": 1115000, "rew": 3478.5048, "rew_std": 144.9464, "Agent": "TD3"}, {"env_step": 1120000, "rew": 3281.0796, "rew_std": 527.6014, "Agent": "TD3"}, {"env_step": 1125000, "rew": 3192.937, "rew_std": 669.8894, "Agent": "TD3"}, {"env_step": 1130000, "rew": 3438.1592, "rew_std": 230.622, "Agent": "TD3"}, {"env_step": 1135000, "rew": 3334.115, "rew_std": 460.8531, "Agent": "TD3"}, {"env_step": 1140000, "rew": 3071.3359, "rew_std": 817.2291, "Agent": "TD3"}, {"env_step": 1145000, "rew": 3422.9416, "rew_std": 196.0724, "Agent": "TD3"}, {"env_step": 1150000, "rew": 3146.4052, "rew_std": 687.3626, "Agent": "TD3"}, {"env_step": 1155000, "rew": 3223.623, "rew_std": 830.6122, "Agent": "TD3"}, {"env_step": 1160000, "rew": 3033.3122, "rew_std": 1060.267, "Agent": "TD3"}, {"env_step": 1165000, "rew": 3280.1819, "rew_std": 527.1591, "Agent": "TD3"}, {"env_step": 1170000, "rew": 3218.5815, "rew_std": 536.6197, "Agent": "TD3"}, {"env_step": 1175000, "rew": 3337.7382, "rew_std": 372.1618, "Agent": "TD3"}, {"env_step": 1180000, "rew": 3064.0044, "rew_std": 729.3349, "Agent": "TD3"}, {"env_step": 1185000, "rew": 3153.8193, "rew_std": 720.2014, "Agent": "TD3"}, {"env_step": 1190000, "rew": 2789.3759, "rew_std": 1169.6733, "Agent": "TD3"}, {"env_step": 1195000, "rew": 3351.8698, "rew_std": 493.6516, "Agent": "TD3"}, {"env_step": 1200000, "rew": 3012.5723, "rew_std": 1035.4349, "Agent": "TD3"}, {"env_step": 1205000, "rew": 3186.304, "rew_std": 730.071, "Agent": "TD3"}, {"env_step": 1210000, "rew": 3420.0329, "rew_std": 201.5622, "Agent": "TD3"}, {"env_step": 1215000, "rew": 3231.3499, "rew_std": 687.0777, "Agent": "TD3"}, {"env_step": 1220000, "rew": 3414.9551, "rew_std": 290.8079, "Agent": "TD3"}, {"env_step": 1225000, "rew": 3302.7639, "rew_std": 645.4993, "Agent": "TD3"}, {"env_step": 1230000, "rew": 3169.7956, "rew_std": 627.4685, "Agent": "TD3"}, {"env_step": 1235000, "rew": 3100.7851, "rew_std": 888.5842, "Agent": "TD3"}, {"env_step": 1240000, "rew": 3441.4178, "rew_std": 279.3749, "Agent": "TD3"}, {"env_step": 1245000, "rew": 3312.542, "rew_std": 575.5337, "Agent": "TD3"}, {"env_step": 1250000, "rew": 3097.3408, "rew_std": 746.9811, "Agent": "TD3"}, {"env_step": 0, "rew": 17.9154, "rew_std": 1.9743, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 29.3731, "rew_std": 10.4893, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 66.6037, "rew_std": 24.3997, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 198.8276, "rew_std": 36.86, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 232.7992, "rew_std": 26.5837, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 260.3133, "rew_std": 22.0087, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 268.9626, "rew_std": 28.6902, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 288.7649, "rew_std": 32.1015, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 295.2648, "rew_std": 22.7345, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 306.5046, "rew_std": 15.8915, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 318.4252, "rew_std": 9.9478, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 322.6908, "rew_std": 17.5204, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 336.2168, "rew_std": 28.7181, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 330.8605, "rew_std": 45.2815, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 331.2807, "rew_std": 23.8464, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 350.7925, "rew_std": 64.5441, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 341.1786, "rew_std": 43.6435, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 346.7587, "rew_std": 38.0414, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 343.9709, "rew_std": 40.9004, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 346.0514, "rew_std": 47.826, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 355.0738, "rew_std": 51.1227, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 353.4741, "rew_std": 39.3418, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 363.9368, "rew_std": 53.8079, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 369.7521, "rew_std": 76.4353, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 362.2687, "rew_std": 94.7053, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 367.0035, "rew_std": 79.9643, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 365.8843, "rew_std": 73.7307, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 370.4545, "rew_std": 74.0224, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 354.3553, "rew_std": 59.5886, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 386.9329, "rew_std": 76.6984, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 386.7397, "rew_std": 80.6028, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 387.5511, "rew_std": 95.2815, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 389.9666, "rew_std": 84.4154, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 374.6943, "rew_std": 68.1604, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 387.5142, "rew_std": 68.4897, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 379.5257, "rew_std": 61.456, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 382.3943, "rew_std": 63.4778, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 376.9915, "rew_std": 69.3571, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 386.4603, "rew_std": 67.3477, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 393.3204, "rew_std": 79.687, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 375.8716, "rew_std": 49.7071, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 377.5592, "rew_std": 60.5279, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 369.21, "rew_std": 29.6277, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 373.6731, "rew_std": 42.2747, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 363.1084, "rew_std": 27.0787, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 374.9453, "rew_std": 43.472, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 372.8838, "rew_std": 46.91, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 382.9686, "rew_std": 51.2128, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 374.1388, "rew_std": 55.2316, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 370.8528, "rew_std": 62.1252, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 372.8432, "rew_std": 62.8749, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 381.4441, "rew_std": 67.9162, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 393.132, "rew_std": 66.7161, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 387.3093, "rew_std": 79.775, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 391.0778, "rew_std": 64.053, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 395.8294, "rew_std": 64.4886, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 392.6451, "rew_std": 68.072, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 390.7222, "rew_std": 58.8086, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 374.8847, "rew_std": 39.4855, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 361.9808, "rew_std": 49.6531, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 386.8282, "rew_std": 66.9517, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 373.0323, "rew_std": 63.2295, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 373.7938, "rew_std": 69.8201, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 376.2475, "rew_std": 77.6855, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 380.674, "rew_std": 81.9143, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 377.8038, "rew_std": 70.1288, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 368.3728, "rew_std": 80.0865, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 363.0808, "rew_std": 67.5735, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 371.7142, "rew_std": 60.2024, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 375.6939, "rew_std": 88.9606, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 378.8614, "rew_std": 87.7811, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 379.6722, "rew_std": 79.5336, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 377.2777, "rew_std": 89.5931, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 369.9105, "rew_std": 86.6011, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 377.3181, "rew_std": 71.1586, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 382.9155, "rew_std": 76.8354, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 386.854, "rew_std": 79.9414, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 380.7335, "rew_std": 109.3207, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 393.7874, "rew_std": 80.6004, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 380.0022, "rew_std": 77.799, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 377.9924, "rew_std": 79.3554, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 381.3284, "rew_std": 90.5689, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 373.0119, "rew_std": 75.9316, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 364.0844, "rew_std": 46.8014, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 368.931, "rew_std": 42.3915, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 365.2996, "rew_std": 34.5441, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 375.5965, "rew_std": 51.0352, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 366.0311, "rew_std": 54.5752, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 375.709, "rew_std": 57.4101, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 366.1557, "rew_std": 51.1812, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 362.7805, "rew_std": 52.9235, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 363.9702, "rew_std": 44.3478, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 365.2992, "rew_std": 48.0731, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 370.9386, "rew_std": 66.4269, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 366.0387, "rew_std": 64.0745, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 361.6844, "rew_std": 53.0049, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 364.995, "rew_std": 55.0417, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 367.1026, "rew_std": 46.2725, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 368.1378, "rew_std": 50.5468, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 368.6792, "rew_std": 59.7536, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 355.6231, "rew_std": 41.6614, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 355.8605, "rew_std": 44.1664, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 355.502, "rew_std": 44.6819, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 351.8672, "rew_std": 46.9554, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 354.3732, "rew_std": 39.958, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 363.8132, "rew_std": 43.6584, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 366.9973, "rew_std": 52.4478, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 359.498, "rew_std": 37.2594, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 357.1697, "rew_std": 45.6055, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 356.0397, "rew_std": 33.5679, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 361.9803, "rew_std": 43.0103, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 371.8563, "rew_std": 68.2704, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 371.9357, "rew_std": 57.6749, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 371.5511, "rew_std": 57.979, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 356.9314, "rew_std": 40.984, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 363.4594, "rew_std": 41.5677, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 374.1565, "rew_std": 56.8199, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 371.328, "rew_std": 48.9273, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 368.6637, "rew_std": 52.6637, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 362.5879, "rew_std": 35.8333, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 360.6588, "rew_std": 40.4034, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 358.0624, "rew_std": 27.6744, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 362.8848, "rew_std": 31.2075, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 369.7099, "rew_std": 49.5931, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 362.1919, "rew_std": 26.8217, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 365.3113, "rew_std": 40.6711, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 370.9763, "rew_std": 51.2981, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 394.1719, "rew_std": 79.1728, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 409.7305, "rew_std": 88.1129, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 405.7927, "rew_std": 94.4966, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 405.7145, "rew_std": 98.6886, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 400.252, "rew_std": 91.7664, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 408.2449, "rew_std": 108.9827, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 397.0612, "rew_std": 97.8046, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 402.881, "rew_std": 99.515, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 415.9558, "rew_std": 104.7377, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 391.8573, "rew_std": 94.7846, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 388.7508, "rew_std": 89.8436, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 392.2457, "rew_std": 103.2659, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 386.7837, "rew_std": 90.8458, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 387.743, "rew_std": 103.9218, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 400.4464, "rew_std": 102.1787, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 392.1932, "rew_std": 87.3258, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 396.4165, "rew_std": 105.8792, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 387.7544, "rew_std": 97.0025, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 391.0999, "rew_std": 98.9182, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 391.6717, "rew_std": 102.3208, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 392.4672, "rew_std": 111.5205, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 382.6473, "rew_std": 97.9509, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 385.3088, "rew_std": 96.1275, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 383.38, "rew_std": 97.7575, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 382.9842, "rew_std": 94.2347, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 399.8325, "rew_std": 105.9479, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 390.9329, "rew_std": 98.4279, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 409.3433, "rew_std": 118.3284, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 394.2645, "rew_std": 107.2525, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 384.1185, "rew_std": 102.1598, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 396.9076, "rew_std": 97.2542, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 390.4801, "rew_std": 99.5176, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 389.4399, "rew_std": 92.1015, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 394.0313, "rew_std": 101.7443, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 390.3732, "rew_std": 91.6181, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 383.9362, "rew_std": 91.6545, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 377.8827, "rew_std": 92.611, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 381.0909, "rew_std": 95.6623, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 386.0676, "rew_std": 85.6938, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 374.0582, "rew_std": 62.9661, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 382.5204, "rew_std": 67.5511, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 385.7647, "rew_std": 81.6735, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 385.5587, "rew_std": 79.1534, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 375.1411, "rew_std": 89.7856, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 382.3445, "rew_std": 96.1506, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 392.8232, "rew_std": 121.0017, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 381.6725, "rew_std": 95.3916, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 390.9818, "rew_std": 104.5308, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 384.3439, "rew_std": 106.4543, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 378.383, "rew_std": 107.0747, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 380.5131, "rew_std": 112.1825, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 381.4596, "rew_std": 116.9546, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 376.408, "rew_std": 109.4098, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 371.7655, "rew_std": 94.5637, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 371.3834, "rew_std": 99.8961, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 373.4715, "rew_std": 105.4585, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 379.2169, "rew_std": 114.6349, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 377.9405, "rew_std": 107.3001, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 373.9021, "rew_std": 97.6858, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 375.604, "rew_std": 105.6384, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 379.1034, "rew_std": 103.1234, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 381.6423, "rew_std": 100.8259, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 378.8504, "rew_std": 104.2578, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 382.0778, "rew_std": 110.7984, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 381.9858, "rew_std": 107.0871, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 380.0554, "rew_std": 109.317, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 381.0922, "rew_std": 101.8419, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 378.747, "rew_std": 88.6599, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 392.1596, "rew_std": 94.625, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 388.2924, "rew_std": 106.6063, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 391.8991, "rew_std": 105.9083, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 395.3478, "rew_std": 106.1762, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 402.5229, "rew_std": 118.2928, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 402.5777, "rew_std": 123.3479, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 409.2375, "rew_std": 123.5333, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 401.1756, "rew_std": 105.6258, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 393.5145, "rew_std": 103.74, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 392.5335, "rew_std": 97.7167, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 388.9988, "rew_std": 104.4046, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 400.0679, "rew_std": 111.9244, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 399.2567, "rew_std": 112.5052, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 397.178, "rew_std": 109.4325, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 397.1731, "rew_std": 95.5987, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 405.8894, "rew_std": 102.3605, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 399.0744, "rew_std": 108.8508, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 405.8708, "rew_std": 112.578, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 398.2285, "rew_std": 94.2502, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 404.914, "rew_std": 96.5741, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 393.1239, "rew_std": 84.9309, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 404.68, "rew_std": 102.7677, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 389.5942, "rew_std": 79.4133, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 392.5762, "rew_std": 85.0446, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 399.4966, "rew_std": 93.1352, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 399.9873, "rew_std": 99.9946, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 393.2349, "rew_std": 92.2259, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 387.7151, "rew_std": 88.0488, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 386.5385, "rew_std": 84.4063, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 388.8521, "rew_std": 74.5801, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 398.1654, "rew_std": 90.6041, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 384.939, "rew_std": 71.2728, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 390.8309, "rew_std": 85.7066, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 399.2637, "rew_std": 97.6472, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 389.195, "rew_std": 81.2926, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 398.1003, "rew_std": 93.8406, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 396.5792, "rew_std": 99.5352, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 388.7145, "rew_std": 90.0708, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 389.8861, "rew_std": 85.8735, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 390.0967, "rew_std": 82.3581, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 379.0566, "rew_std": 64.0611, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 385.6624, "rew_std": 81.0679, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 386.8548, "rew_std": 75.6701, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 379.9336, "rew_std": 77.4284, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 379.5128, "rew_std": 75.1445, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 374.7474, "rew_std": 58.1994, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 385.7565, "rew_std": 75.5155, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 379.3197, "rew_std": 67.6012, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 375.6075, "rew_std": 62.7015, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 374.1764, "rew_std": 54.2789, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 392.6875, "rew_std": 68.5086, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 382.8261, "rew_std": 63.2083, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 385.8388, "rew_std": 72.5709, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 392.9784, "rew_std": 84.3356, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 390.1091, "rew_std": 83.1857, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 386.6012, "rew_std": 80.7424, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 388.8892, "rew_std": 63.1784, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 382.1974, "rew_std": 68.2579, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 379.7919, "rew_std": 59.8642, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 387.753, "rew_std": 63.2395, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 387.4659, "rew_std": 64.6213, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 379.2728, "rew_std": 85.6654, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 387.6978, "rew_std": 71.3842, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 387.5727, "rew_std": 75.2939, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 388.9357, "rew_std": 72.2209, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 387.5855, "rew_std": 73.3018, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 383.1652, "rew_std": 72.855, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 396.8474, "rew_std": 84.074, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 383.3162, "rew_std": 73.0269, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 387.3427, "rew_std": 74.5757, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 391.8142, "rew_std": 60.3373, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 384.0898, "rew_std": 65.3742, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 388.1516, "rew_std": 71.4981, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 386.9834, "rew_std": 66.7738, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 393.1251, "rew_std": 89.5124, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 390.7711, "rew_std": 69.4544, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 390.4361, "rew_std": 74.7419, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 384.8838, "rew_std": 74.9661, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 387.1014, "rew_std": 73.4848, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 385.2746, "rew_std": 65.9136, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 389.9486, "rew_std": 82.8964, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 381.0628, "rew_std": 74.0303, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 396.4438, "rew_std": 81.3918, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 387.083, "rew_std": 70.84, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 384.714, "rew_std": 71.8535, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 387.3163, "rew_std": 73.4316, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 376.7846, "rew_std": 66.9371, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 389.0855, "rew_std": 66.3918, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 386.6858, "rew_std": 74.6856, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 380.3388, "rew_std": 62.0064, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 391.8039, "rew_std": 70.9114, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 385.2417, "rew_std": 81.3082, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 382.185, "rew_std": 67.3521, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 390.1358, "rew_std": 68.1274, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 392.2323, "rew_std": 79.9112, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 385.8885, "rew_std": 59.5361, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 390.0189, "rew_std": 75.2109, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 389.2995, "rew_std": 78.8738, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 389.9112, "rew_std": 77.0676, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 390.7582, "rew_std": 61.6335, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 386.58, "rew_std": 67.7454, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 393.7479, "rew_std": 84.891, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 387.8405, "rew_std": 79.688, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 389.0189, "rew_std": 72.7803, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 393.9931, "rew_std": 89.404, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 391.9484, "rew_std": 81.6346, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 391.9803, "rew_std": 83.1838, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 393.2402, "rew_std": 80.7977, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 388.6211, "rew_std": 65.8222, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 386.8091, "rew_std": 65.9946, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 393.0005, "rew_std": 82.596, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 398.6098, "rew_std": 77.0395, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 387.6794, "rew_std": 68.2785, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 396.2232, "rew_std": 84.8934, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 393.7139, "rew_std": 72.3839, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 386.8038, "rew_std": 78.5513, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 398.665, "rew_std": 83.0765, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 394.106, "rew_std": 81.1441, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 394.6446, "rew_std": 80.3958, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 394.4672, "rew_std": 92.5547, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 394.4883, "rew_std": 85.8432, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 383.2617, "rew_std": 62.3773, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 393.0799, "rew_std": 88.1284, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 393.9025, "rew_std": 91.0352, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 402.741, "rew_std": 85.7434, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 390.5062, "rew_std": 64.6333, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 395.8816, "rew_std": 81.3256, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 389.786, "rew_std": 75.6932, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 392.9576, "rew_std": 76.6835, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 386.0522, "rew_std": 74.3712, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 387.3965, "rew_std": 70.1528, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 395.1271, "rew_std": 97.8375, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 395.2879, "rew_std": 74.4887, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 395.3669, "rew_std": 83.4544, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 378.1233, "rew_std": 66.645, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 390.0436, "rew_std": 78.3602, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 390.2037, "rew_std": 83.6567, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 384.08, "rew_std": 66.8607, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 391.8881, "rew_std": 86.4776, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 47.4556, "rew_std": 36.0937, "Agent": "SAC"}, {"env_step": 5000, "rew": 275.7761, "rew_std": 59.4556, "Agent": "SAC"}, {"env_step": 10000, "rew": 282.0917, "rew_std": 46.6158, "Agent": "SAC"}, {"env_step": 15000, "rew": 336.6352, "rew_std": 45.5268, "Agent": "SAC"}, {"env_step": 20000, "rew": 350.7719, "rew_std": 59.4432, "Agent": "SAC"}, {"env_step": 25000, "rew": 393.867, "rew_std": 94.7212, "Agent": "SAC"}, {"env_step": 30000, "rew": 493.3881, "rew_std": 205.9798, "Agent": "SAC"}, {"env_step": 35000, "rew": 535.254, "rew_std": 222.4849, "Agent": "SAC"}, {"env_step": 40000, "rew": 1029.6053, "rew_std": 793.9815, "Agent": "SAC"}, {"env_step": 45000, "rew": 705.2766, "rew_std": 641.1404, "Agent": "SAC"}, {"env_step": 50000, "rew": 851.1729, "rew_std": 372.5027, "Agent": "SAC"}, {"env_step": 55000, "rew": 1182.7687, "rew_std": 721.6847, "Agent": "SAC"}, {"env_step": 60000, "rew": 930.261, "rew_std": 399.8715, "Agent": "SAC"}, {"env_step": 65000, "rew": 1422.8022, "rew_std": 1090.8127, "Agent": "SAC"}, {"env_step": 70000, "rew": 1387.1509, "rew_std": 1089.2428, "Agent": "SAC"}, {"env_step": 75000, "rew": 1521.7049, "rew_std": 1072.2036, "Agent": "SAC"}, {"env_step": 80000, "rew": 1523.1274, "rew_std": 812.4802, "Agent": "SAC"}, {"env_step": 85000, "rew": 1787.7521, "rew_std": 997.5609, "Agent": "SAC"}, {"env_step": 90000, "rew": 1765.9052, "rew_std": 1035.8665, "Agent": "SAC"}, {"env_step": 95000, "rew": 2079.4099, "rew_std": 1125.9664, "Agent": "SAC"}, {"env_step": 100000, "rew": 2613.4592, "rew_std": 990.7811, "Agent": "SAC"}, {"env_step": 105000, "rew": 2505.2093, "rew_std": 1014.8763, "Agent": "SAC"}, {"env_step": 110000, "rew": 1882.9724, "rew_std": 903.8805, "Agent": "SAC"}, {"env_step": 115000, "rew": 2251.6213, "rew_std": 1015.3205, "Agent": "SAC"}, {"env_step": 120000, "rew": 2083.6742, "rew_std": 1150.8883, "Agent": "SAC"}, {"env_step": 125000, "rew": 2037.7974, "rew_std": 1069.9703, "Agent": "SAC"}, {"env_step": 130000, "rew": 2447.5492, "rew_std": 1104.9526, "Agent": "SAC"}, {"env_step": 135000, "rew": 2434.7552, "rew_std": 991.8537, "Agent": "SAC"}, {"env_step": 140000, "rew": 2720.4292, "rew_std": 934.5695, "Agent": "SAC"}, {"env_step": 145000, "rew": 2583.2391, "rew_std": 1002.1706, "Agent": "SAC"}, {"env_step": 150000, "rew": 2782.7663, "rew_std": 827.8125, "Agent": "SAC"}, {"env_step": 155000, "rew": 2899.1311, "rew_std": 683.8363, "Agent": "SAC"}, {"env_step": 160000, "rew": 2912.7348, "rew_std": 704.0542, "Agent": "SAC"}, {"env_step": 165000, "rew": 2908.8992, "rew_std": 758.2095, "Agent": "SAC"}, {"env_step": 170000, "rew": 2830.1015, "rew_std": 582.8762, "Agent": "SAC"}, {"env_step": 175000, "rew": 3058.4135, "rew_std": 416.2314, "Agent": "SAC"}, {"env_step": 180000, "rew": 2800.0321, "rew_std": 969.0885, "Agent": "SAC"}, {"env_step": 185000, "rew": 2993.8637, "rew_std": 707.68, "Agent": "SAC"}, {"env_step": 190000, "rew": 2382.8887, "rew_std": 1161.7076, "Agent": "SAC"}, {"env_step": 195000, "rew": 3015.8118, "rew_std": 506.8064, "Agent": "SAC"}, {"env_step": 200000, "rew": 3234.4156, "rew_std": 314.1973, "Agent": "SAC"}, {"env_step": 205000, "rew": 3099.8164, "rew_std": 619.2829, "Agent": "SAC"}, {"env_step": 210000, "rew": 2495.4626, "rew_std": 1158.0519, "Agent": "SAC"}, {"env_step": 215000, "rew": 2738.6383, "rew_std": 982.2683, "Agent": "SAC"}, {"env_step": 220000, "rew": 2957.1676, "rew_std": 777.4626, "Agent": "SAC"}, {"env_step": 225000, "rew": 2915.008, "rew_std": 750.9862, "Agent": "SAC"}, {"env_step": 230000, "rew": 3173.0933, "rew_std": 545.6744, "Agent": "SAC"}, {"env_step": 235000, "rew": 3352.3255, "rew_std": 144.4022, "Agent": "SAC"}, {"env_step": 240000, "rew": 3170.9914, "rew_std": 657.4997, "Agent": "SAC"}, {"env_step": 245000, "rew": 3294.4914, "rew_std": 278.824, "Agent": "SAC"}, {"env_step": 250000, "rew": 3222.7075, "rew_std": 280.7911, "Agent": "SAC"}, {"env_step": 255000, "rew": 3297.9414, "rew_std": 224.8675, "Agent": "SAC"}, {"env_step": 260000, "rew": 3382.6137, "rew_std": 129.619, "Agent": "SAC"}, {"env_step": 265000, "rew": 3385.8352, "rew_std": 131.3435, "Agent": "SAC"}, {"env_step": 270000, "rew": 3345.2796, "rew_std": 213.9516, "Agent": "SAC"}, {"env_step": 275000, "rew": 3108.6666, "rew_std": 687.6853, "Agent": "SAC"}, {"env_step": 280000, "rew": 2807.6834, "rew_std": 1111.6307, "Agent": "SAC"}, {"env_step": 285000, "rew": 2989.1773, "rew_std": 888.0763, "Agent": "SAC"}, {"env_step": 290000, "rew": 3165.0168, "rew_std": 670.5128, "Agent": "SAC"}, {"env_step": 295000, "rew": 3403.0451, "rew_std": 95.1653, "Agent": "SAC"}, {"env_step": 300000, "rew": 3387.6597, "rew_std": 114.6012, "Agent": "SAC"}, {"env_step": 305000, "rew": 3327.1286, "rew_std": 317.4994, "Agent": "SAC"}, {"env_step": 310000, "rew": 3402.2741, "rew_std": 118.2682, "Agent": "SAC"}, {"env_step": 315000, "rew": 3335.9056, "rew_std": 249.4078, "Agent": "SAC"}, {"env_step": 320000, "rew": 3389.7038, "rew_std": 113.1724, "Agent": "SAC"}, {"env_step": 325000, "rew": 3439.6622, "rew_std": 96.1649, "Agent": "SAC"}, {"env_step": 330000, "rew": 2915.1265, "rew_std": 1128.311, "Agent": "SAC"}, {"env_step": 335000, "rew": 3355.5532, "rew_std": 187.5645, "Agent": "SAC"}, {"env_step": 340000, "rew": 3235.9036, "rew_std": 642.4013, "Agent": "SAC"}, {"env_step": 345000, "rew": 3244.4175, "rew_std": 612.4494, "Agent": "SAC"}, {"env_step": 350000, "rew": 3386.5798, "rew_std": 238.5771, "Agent": "SAC"}, {"env_step": 355000, "rew": 3194.7686, "rew_std": 700.3986, "Agent": "SAC"}, {"env_step": 360000, "rew": 3413.1038, "rew_std": 116.8649, "Agent": "SAC"}, {"env_step": 365000, "rew": 3289.0649, "rew_std": 496.0933, "Agent": "SAC"}, {"env_step": 370000, "rew": 3352.8785, "rew_std": 266.9787, "Agent": "SAC"}, {"env_step": 375000, "rew": 3431.5784, "rew_std": 116.194, "Agent": "SAC"}, {"env_step": 380000, "rew": 3179.7096, "rew_std": 586.7048, "Agent": "SAC"}, {"env_step": 385000, "rew": 3269.7002, "rew_std": 600.8841, "Agent": "SAC"}, {"env_step": 390000, "rew": 3362.5338, "rew_std": 315.9082, "Agent": "SAC"}, {"env_step": 395000, "rew": 3259.2257, "rew_std": 587.5798, "Agent": "SAC"}, {"env_step": 400000, "rew": 3300.7786, "rew_std": 477.0863, "Agent": "SAC"}, {"env_step": 405000, "rew": 3156.5526, "rew_std": 622.6734, "Agent": "SAC"}, {"env_step": 410000, "rew": 3440.1684, "rew_std": 83.916, "Agent": "SAC"}, {"env_step": 415000, "rew": 3427.2914, "rew_std": 112.7821, "Agent": "SAC"}, {"env_step": 420000, "rew": 3278.1821, "rew_std": 417.4718, "Agent": "SAC"}, {"env_step": 425000, "rew": 3286.694, "rew_std": 544.7659, "Agent": "SAC"}, {"env_step": 430000, "rew": 3298.7286, "rew_std": 489.6424, "Agent": "SAC"}, {"env_step": 435000, "rew": 3108.858, "rew_std": 612.0163, "Agent": "SAC"}, {"env_step": 440000, "rew": 3373.391, "rew_std": 303.656, "Agent": "SAC"}, {"env_step": 445000, "rew": 3348.5861, "rew_std": 332.7744, "Agent": "SAC"}, {"env_step": 450000, "rew": 3129.1637, "rew_std": 1045.6309, "Agent": "SAC"}, {"env_step": 455000, "rew": 3315.3106, "rew_std": 446.1883, "Agent": "SAC"}, {"env_step": 460000, "rew": 3351.584, "rew_std": 363.8294, "Agent": "SAC"}, {"env_step": 465000, "rew": 3408.3243, "rew_std": 247.8712, "Agent": "SAC"}, {"env_step": 470000, "rew": 3269.2203, "rew_std": 626.2374, "Agent": "SAC"}, {"env_step": 475000, "rew": 3479.7509, "rew_std": 76.4065, "Agent": "SAC"}, {"env_step": 480000, "rew": 3307.292, "rew_std": 572.615, "Agent": "SAC"}, {"env_step": 485000, "rew": 3358.0348, "rew_std": 392.7433, "Agent": "SAC"}, {"env_step": 490000, "rew": 3289.9174, "rew_std": 620.9423, "Agent": "SAC"}, {"env_step": 495000, "rew": 3149.5783, "rew_std": 983.6098, "Agent": "SAC"}, {"env_step": 500000, "rew": 3153.8445, "rew_std": 689.3463, "Agent": "SAC"}, {"env_step": 505000, "rew": 3343.6685, "rew_std": 428.8474, "Agent": "SAC"}, {"env_step": 510000, "rew": 3352.6351, "rew_std": 453.2007, "Agent": "SAC"}, {"env_step": 515000, "rew": 3496.9786, "rew_std": 67.199, "Agent": "SAC"}, {"env_step": 520000, "rew": 3308.8103, "rew_std": 560.9129, "Agent": "SAC"}, {"env_step": 525000, "rew": 3429.5733, "rew_std": 181.7485, "Agent": "SAC"}, {"env_step": 530000, "rew": 3502.2174, "rew_std": 55.4399, "Agent": "SAC"}, {"env_step": 535000, "rew": 3307.6355, "rew_std": 573.1831, "Agent": "SAC"}, {"env_step": 540000, "rew": 3494.0667, "rew_std": 74.681, "Agent": "SAC"}, {"env_step": 545000, "rew": 3152.4726, "rew_std": 919.3493, "Agent": "SAC"}, {"env_step": 550000, "rew": 3496.8042, "rew_std": 69.283, "Agent": "SAC"}, {"env_step": 555000, "rew": 3472.1212, "rew_std": 103.5854, "Agent": "SAC"}, {"env_step": 560000, "rew": 3466.4866, "rew_std": 110.1099, "Agent": "SAC"}, {"env_step": 565000, "rew": 3485.939, "rew_std": 80.6578, "Agent": "SAC"}, {"env_step": 570000, "rew": 3488.7434, "rew_std": 77.3344, "Agent": "SAC"}, {"env_step": 575000, "rew": 3147.2589, "rew_std": 989.8934, "Agent": "SAC"}, {"env_step": 580000, "rew": 3342.3024, "rew_std": 472.1387, "Agent": "SAC"}, {"env_step": 585000, "rew": 3505.615, "rew_std": 66.4951, "Agent": "SAC"}, {"env_step": 590000, "rew": 3434.079, "rew_std": 222.5851, "Agent": "SAC"}, {"env_step": 595000, "rew": 3302.6204, "rew_std": 527.5602, "Agent": "SAC"}, {"env_step": 600000, "rew": 3469.6485, "rew_std": 129.1016, "Agent": "SAC"}, {"env_step": 605000, "rew": 3453.9831, "rew_std": 128.9461, "Agent": "SAC"}, {"env_step": 610000, "rew": 3496.7596, "rew_std": 49.8348, "Agent": "SAC"}, {"env_step": 615000, "rew": 3497.4815, "rew_std": 62.9814, "Agent": "SAC"}, {"env_step": 620000, "rew": 3509.1201, "rew_std": 45.4985, "Agent": "SAC"}, {"env_step": 625000, "rew": 3513.9445, "rew_std": 49.767, "Agent": "SAC"}, {"env_step": 630000, "rew": 3485.2062, "rew_std": 62.7697, "Agent": "SAC"}, {"env_step": 635000, "rew": 3463.5502, "rew_std": 138.2686, "Agent": "SAC"}, {"env_step": 640000, "rew": 3504.1595, "rew_std": 63.7314, "Agent": "SAC"}, {"env_step": 645000, "rew": 3506.4354, "rew_std": 54.2136, "Agent": "SAC"}, {"env_step": 650000, "rew": 3504.8205, "rew_std": 66.3304, "Agent": "SAC"}, {"env_step": 655000, "rew": 3512.5706, "rew_std": 51.5125, "Agent": "SAC"}, {"env_step": 660000, "rew": 3511.0268, "rew_std": 52.0514, "Agent": "SAC"}, {"env_step": 665000, "rew": 3513.4651, "rew_std": 54.3786, "Agent": "SAC"}, {"env_step": 670000, "rew": 3507.2821, "rew_std": 55.4767, "Agent": "SAC"}, {"env_step": 675000, "rew": 3518.2688, "rew_std": 53.0561, "Agent": "SAC"}, {"env_step": 680000, "rew": 3349.8544, "rew_std": 489.5576, "Agent": "SAC"}, {"env_step": 685000, "rew": 3330.8927, "rew_std": 539.2089, "Agent": "SAC"}, {"env_step": 690000, "rew": 3496.2697, "rew_std": 98.1611, "Agent": "SAC"}, {"env_step": 695000, "rew": 3514.8186, "rew_std": 61.7482, "Agent": "SAC"}, {"env_step": 700000, "rew": 3503.5561, "rew_std": 64.6355, "Agent": "SAC"}, {"env_step": 705000, "rew": 3497.2257, "rew_std": 61.3456, "Agent": "SAC"}, {"env_step": 710000, "rew": 3520.9237, "rew_std": 65.9712, "Agent": "SAC"}, {"env_step": 715000, "rew": 3489.5284, "rew_std": 136.7891, "Agent": "SAC"}, {"env_step": 720000, "rew": 3527.6567, "rew_std": 63.4808, "Agent": "SAC"}, {"env_step": 725000, "rew": 3516.5266, "rew_std": 54.1486, "Agent": "SAC"}, {"env_step": 730000, "rew": 3519.1343, "rew_std": 52.9873, "Agent": "SAC"}, {"env_step": 735000, "rew": 3490.632, "rew_std": 96.6564, "Agent": "SAC"}, {"env_step": 740000, "rew": 3506.4161, "rew_std": 109.7111, "Agent": "SAC"}, {"env_step": 745000, "rew": 3514.3282, "rew_std": 61.8251, "Agent": "SAC"}, {"env_step": 750000, "rew": 3511.3453, "rew_std": 56.5664, "Agent": "SAC"}, {"env_step": 755000, "rew": 3508.2242, "rew_std": 43.2657, "Agent": "SAC"}, {"env_step": 760000, "rew": 3513.4562, "rew_std": 49.6405, "Agent": "SAC"}, {"env_step": 765000, "rew": 3447.2038, "rew_std": 214.2386, "Agent": "SAC"}, {"env_step": 770000, "rew": 3281.5668, "rew_std": 691.0348, "Agent": "SAC"}, {"env_step": 775000, "rew": 3520.0712, "rew_std": 64.6354, "Agent": "SAC"}, {"env_step": 780000, "rew": 3516.2051, "rew_std": 60.5938, "Agent": "SAC"}, {"env_step": 785000, "rew": 3519.0088, "rew_std": 62.0088, "Agent": "SAC"}, {"env_step": 790000, "rew": 3524.6045, "rew_std": 54.7701, "Agent": "SAC"}, {"env_step": 795000, "rew": 3501.6906, "rew_std": 58.4171, "Agent": "SAC"}, {"env_step": 800000, "rew": 3509.3966, "rew_std": 56.6941, "Agent": "SAC"}, {"env_step": 805000, "rew": 3515.611, "rew_std": 54.3113, "Agent": "SAC"}, {"env_step": 810000, "rew": 3522.4115, "rew_std": 60.0603, "Agent": "SAC"}, {"env_step": 815000, "rew": 3525.2187, "rew_std": 60.8522, "Agent": "SAC"}, {"env_step": 820000, "rew": 3517.6993, "rew_std": 60.5311, "Agent": "SAC"}, {"env_step": 825000, "rew": 3511.3608, "rew_std": 53.1438, "Agent": "SAC"}, {"env_step": 830000, "rew": 3525.4017, "rew_std": 59.3785, "Agent": "SAC"}, {"env_step": 835000, "rew": 3517.3174, "rew_std": 51.8875, "Agent": "SAC"}, {"env_step": 840000, "rew": 3511.427, "rew_std": 48.9103, "Agent": "SAC"}, {"env_step": 845000, "rew": 3233.2189, "rew_std": 902.9686, "Agent": "SAC"}, {"env_step": 850000, "rew": 3505.4327, "rew_std": 53.0899, "Agent": "SAC"}, {"env_step": 855000, "rew": 3521.5302, "rew_std": 58.6207, "Agent": "SAC"}, {"env_step": 860000, "rew": 3532.3486, "rew_std": 68.1457, "Agent": "SAC"}, {"env_step": 865000, "rew": 3523.5765, "rew_std": 53.409, "Agent": "SAC"}, {"env_step": 870000, "rew": 3236.7132, "rew_std": 895.7161, "Agent": "SAC"}, {"env_step": 875000, "rew": 3517.0279, "rew_std": 56.7523, "Agent": "SAC"}, {"env_step": 880000, "rew": 3522.4118, "rew_std": 58.5564, "Agent": "SAC"}, {"env_step": 885000, "rew": 3161.5897, "rew_std": 1046.7225, "Agent": "SAC"}, {"env_step": 890000, "rew": 3537.7698, "rew_std": 47.4872, "Agent": "SAC"}, {"env_step": 895000, "rew": 3519.0764, "rew_std": 60.8041, "Agent": "SAC"}, {"env_step": 900000, "rew": 3520.3896, "rew_std": 55.8492, "Agent": "SAC"}, {"env_step": 905000, "rew": 3523.8942, "rew_std": 56.3431, "Agent": "SAC"}, {"env_step": 910000, "rew": 3538.571, "rew_std": 40.6978, "Agent": "SAC"}, {"env_step": 915000, "rew": 3450.8878, "rew_std": 236.0645, "Agent": "SAC"}, {"env_step": 920000, "rew": 3524.2823, "rew_std": 51.914, "Agent": "SAC"}, {"env_step": 925000, "rew": 3202.4734, "rew_std": 977.0959, "Agent": "SAC"}, {"env_step": 930000, "rew": 3273.1453, "rew_std": 734.3886, "Agent": "SAC"}, {"env_step": 935000, "rew": 3455.3452, "rew_std": 206.2434, "Agent": "SAC"}, {"env_step": 940000, "rew": 3175.5728, "rew_std": 1042.4874, "Agent": "SAC"}, {"env_step": 945000, "rew": 3527.0726, "rew_std": 55.3019, "Agent": "SAC"}, {"env_step": 950000, "rew": 3535.6306, "rew_std": 49.2671, "Agent": "SAC"}, {"env_step": 955000, "rew": 3525.8447, "rew_std": 46.4758, "Agent": "SAC"}, {"env_step": 960000, "rew": 3531.017, "rew_std": 52.1814, "Agent": "SAC"}, {"env_step": 965000, "rew": 3520.952, "rew_std": 52.5745, "Agent": "SAC"}, {"env_step": 970000, "rew": 3542.2142, "rew_std": 51.4682, "Agent": "SAC"}, {"env_step": 975000, "rew": 3527.5707, "rew_std": 45.3567, "Agent": "SAC"}, {"env_step": 980000, "rew": 3189.7376, "rew_std": 997.8534, "Agent": "SAC"}, {"env_step": 985000, "rew": 3520.5999, "rew_std": 35.5321, "Agent": "SAC"}, {"env_step": 990000, "rew": 3515.0443, "rew_std": 36.0914, "Agent": "SAC"}, {"env_step": 995000, "rew": 3520.7646, "rew_std": 44.903, "Agent": "SAC"}, {"env_step": 1000000, "rew": 3531.5999, "rew_std": 43.2168, "Agent": "SAC"}, {"env_step": 1005000, "rew": 3537.6764, "rew_std": 41.3989, "Agent": "SAC"}, {"env_step": 1010000, "rew": 3537.5447, "rew_std": 44.6579, "Agent": "SAC"}, {"env_step": 1015000, "rew": 3524.9329, "rew_std": 56.391, "Agent": "SAC"}, {"env_step": 1020000, "rew": 3459.5167, "rew_std": 247.163, "Agent": "SAC"}, {"env_step": 1025000, "rew": 3540.6938, "rew_std": 37.3364, "Agent": "SAC"}, {"env_step": 1030000, "rew": 3533.2482, "rew_std": 48.7726, "Agent": "SAC"}, {"env_step": 1035000, "rew": 3521.0612, "rew_std": 58.0774, "Agent": "SAC"}, {"env_step": 1040000, "rew": 3546.4092, "rew_std": 48.796, "Agent": "SAC"}, {"env_step": 1045000, "rew": 3535.2375, "rew_std": 46.4841, "Agent": "SAC"}, {"env_step": 1050000, "rew": 3546.7265, "rew_std": 42.9841, "Agent": "SAC"}, {"env_step": 1055000, "rew": 3527.3797, "rew_std": 49.7837, "Agent": "SAC"}, {"env_step": 1060000, "rew": 3544.2985, "rew_std": 50.6251, "Agent": "SAC"}, {"env_step": 1065000, "rew": 3504.0597, "rew_std": 137.2038, "Agent": "SAC"}, {"env_step": 1070000, "rew": 3548.3365, "rew_std": 42.6806, "Agent": "SAC"}, {"env_step": 1075000, "rew": 3547.6729, "rew_std": 49.0633, "Agent": "SAC"}, {"env_step": 1080000, "rew": 3546.0549, "rew_std": 40.8882, "Agent": "SAC"}, {"env_step": 1085000, "rew": 3518.5469, "rew_std": 109.8673, "Agent": "SAC"}, {"env_step": 1090000, "rew": 3151.1933, "rew_std": 909.5713, "Agent": "SAC"}, {"env_step": 1095000, "rew": 3440.9245, "rew_std": 322.2829, "Agent": "SAC"}, {"env_step": 1100000, "rew": 3029.8716, "rew_std": 1071.2459, "Agent": "SAC"}, {"env_step": 1105000, "rew": 3557.3477, "rew_std": 33.0738, "Agent": "SAC"}, {"env_step": 1110000, "rew": 3395.5135, "rew_std": 338.1572, "Agent": "SAC"}, {"env_step": 1115000, "rew": 3550.1206, "rew_std": 48.1577, "Agent": "SAC"}, {"env_step": 1120000, "rew": 3561.1023, "rew_std": 40.9386, "Agent": "SAC"}, {"env_step": 1125000, "rew": 3533.8194, "rew_std": 61.1164, "Agent": "SAC"}, {"env_step": 1130000, "rew": 3463.6075, "rew_std": 266.0974, "Agent": "SAC"}, {"env_step": 1135000, "rew": 3570.4994, "rew_std": 47.6836, "Agent": "SAC"}, {"env_step": 1140000, "rew": 3551.0034, "rew_std": 41.5901, "Agent": "SAC"}, {"env_step": 1145000, "rew": 3564.5966, "rew_std": 39.7762, "Agent": "SAC"}, {"env_step": 1150000, "rew": 3181.0511, "rew_std": 1060.7804, "Agent": "SAC"}, {"env_step": 1155000, "rew": 3462.0114, "rew_std": 197.7437, "Agent": "SAC"}, {"env_step": 1160000, "rew": 3425.1199, "rew_std": 361.8834, "Agent": "SAC"}, {"env_step": 1165000, "rew": 3352.6739, "rew_std": 518.6627, "Agent": "SAC"}, {"env_step": 1170000, "rew": 3557.2332, "rew_std": 43.5451, "Agent": "SAC"}, {"env_step": 1175000, "rew": 3554.7394, "rew_std": 35.583, "Agent": "SAC"}, {"env_step": 1180000, "rew": 3557.5383, "rew_std": 31.4509, "Agent": "SAC"}, {"env_step": 1185000, "rew": 3551.5281, "rew_std": 36.8617, "Agent": "SAC"}, {"env_step": 1190000, "rew": 3370.5322, "rew_std": 534.8758, "Agent": "SAC"}, {"env_step": 1195000, "rew": 3462.1363, "rew_std": 255.2329, "Agent": "SAC"}, {"env_step": 1200000, "rew": 3515.0849, "rew_std": 121.4034, "Agent": "SAC"}, {"env_step": 1205000, "rew": 3541.7524, "rew_std": 77.3033, "Agent": "SAC"}, {"env_step": 1210000, "rew": 3567.9682, "rew_std": 50.4551, "Agent": "SAC"}, {"env_step": 1215000, "rew": 3550.3638, "rew_std": 34.3122, "Agent": "SAC"}, {"env_step": 1220000, "rew": 3561.7984, "rew_std": 37.095, "Agent": "SAC"}, {"env_step": 1225000, "rew": 3509.1085, "rew_std": 193.0366, "Agent": "SAC"}, {"env_step": 1230000, "rew": 3531.0292, "rew_std": 99.6654, "Agent": "SAC"}, {"env_step": 1235000, "rew": 3573.5177, "rew_std": 49.6752, "Agent": "SAC"}, {"env_step": 1240000, "rew": 3545.2726, "rew_std": 71.9973, "Agent": "SAC"}, {"env_step": 1245000, "rew": 3487.1151, "rew_std": 227.3082, "Agent": "SAC"}, {"env_step": 1250000, "rew": 3547.1835, "rew_std": 38.5091, "Agent": "SAC"}, {"env_step": 0, "rew": 17.3274, "rew_std": 3.1882, "Agent": "TRPO"}, {"env_step": 30720, "rew": 233.7668, "rew_std": 18.8559, "Agent": "TRPO"}, {"env_step": 61440, "rew": 298.1263, "rew_std": 81.1015, "Agent": "TRPO"}, {"env_step": 92160, "rew": 325.7863, "rew_std": 62.1168, "Agent": "TRPO"}, {"env_step": 122880, "rew": 358.3496, "rew_std": 71.4976, "Agent": "TRPO"}, {"env_step": 153600, "rew": 375.9593, "rew_std": 70.5803, "Agent": "TRPO"}, {"env_step": 184320, "rew": 398.5706, "rew_std": 105.4031, "Agent": "TRPO"}, {"env_step": 215040, "rew": 410.154, "rew_std": 115.6071, "Agent": "TRPO"}, {"env_step": 245760, "rew": 425.957, "rew_std": 137.304, "Agent": "TRPO"}, {"env_step": 276480, "rew": 430.9357, "rew_std": 122.482, "Agent": "TRPO"}, {"env_step": 307200, "rew": 507.8167, "rew_std": 277.9642, "Agent": "TRPO"}, {"env_step": 337920, "rew": 634.4965, "rew_std": 457.2043, "Agent": "TRPO"}, {"env_step": 368640, "rew": 812.3279, "rew_std": 694.1096, "Agent": "TRPO"}, {"env_step": 399360, "rew": 818.5923, "rew_std": 559.483, "Agent": "TRPO"}, {"env_step": 430080, "rew": 894.2241, "rew_std": 521.3391, "Agent": "TRPO"}, {"env_step": 460800, "rew": 975.9629, "rew_std": 519.4792, "Agent": "TRPO"}, {"env_step": 491520, "rew": 945.1953, "rew_std": 471.9335, "Agent": "TRPO"}, {"env_step": 522240, "rew": 1089.0439, "rew_std": 637.3884, "Agent": "TRPO"}, {"env_step": 552960, "rew": 1069.8288, "rew_std": 577.7914, "Agent": "TRPO"}, {"env_step": 583680, "rew": 1068.6961, "rew_std": 524.5628, "Agent": "TRPO"}, {"env_step": 614400, "rew": 1363.4712, "rew_std": 759.5915, "Agent": "TRPO"}, {"env_step": 645120, "rew": 1272.1759, "rew_std": 632.1076, "Agent": "TRPO"}, {"env_step": 675840, "rew": 1442.5838, "rew_std": 850.6924, "Agent": "TRPO"}, {"env_step": 706560, "rew": 1579.9689, "rew_std": 890.0017, "Agent": "TRPO"}, {"env_step": 737280, "rew": 1668.6527, "rew_std": 989.1277, "Agent": "TRPO"}, {"env_step": 768000, "rew": 1634.7542, "rew_std": 913.2596, "Agent": "TRPO"}, {"env_step": 798720, "rew": 1666.9664, "rew_std": 907.2841, "Agent": "TRPO"}, {"env_step": 829440, "rew": 1866.8377, "rew_std": 892.0204, "Agent": "TRPO"}, {"env_step": 860160, "rew": 1856.6282, "rew_std": 879.1212, "Agent": "TRPO"}, {"env_step": 890880, "rew": 2046.0458, "rew_std": 1037.8581, "Agent": "TRPO"}, {"env_step": 921600, "rew": 2000.8053, "rew_std": 914.3049, "Agent": "TRPO"}, {"env_step": 952320, "rew": 1833.8615, "rew_std": 932.996, "Agent": "TRPO"}, {"env_step": 983040, "rew": 2020.3857, "rew_std": 1101.9795, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 2006.4676, "rew_std": 927.6951, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 2050.02, "rew_std": 1060.7432, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 1817.2615, "rew_std": 741.5132, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 1947.5662, "rew_std": 1063.159, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 1906.7756, "rew_std": 975.5771, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 2003.1815, "rew_std": 1082.4816, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 2042.0015, "rew_std": 1096.7791, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 2126.101, "rew_std": 1164.467, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 2108.2943, "rew_std": 1136.4875, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 2147.9696, "rew_std": 1136.5707, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 2047.2856, "rew_std": 1137.6954, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 1976.4187, "rew_std": 1019.6263, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 1886.957, "rew_std": 1020.8876, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 2176.439, "rew_std": 1124.3158, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 2062.1238, "rew_std": 1033.0589, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 2025.7069, "rew_std": 1050.537, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 2008.325, "rew_std": 997.508, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 2265.3851, "rew_std": 1087.0787, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 2230.1246, "rew_std": 1092.5622, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 2167.5746, "rew_std": 1091.8927, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 2285.9649, "rew_std": 1021.1309, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 1932.2893, "rew_std": 848.5764, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 2413.8677, "rew_std": 1042.6641, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 2183.6026, "rew_std": 1076.4357, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 2214.1489, "rew_std": 998.4885, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 2369.7069, "rew_std": 1030.0079, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 2271.6798, "rew_std": 1047.97, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 2184.2902, "rew_std": 971.1338, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 2185.7843, "rew_std": 998.9846, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 2177.7353, "rew_std": 945.4112, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 2317.1312, "rew_std": 1047.9088, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 2499.6737, "rew_std": 1033.8052, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 2270.618, "rew_std": 919.9233, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 2321.4618, "rew_std": 955.0355, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 2186.1345, "rew_std": 1067.9878, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 2322.2783, "rew_std": 987.7264, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 2300.4148, "rew_std": 922.8249, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 2340.7148, "rew_std": 981.3813, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 2541.9973, "rew_std": 1047.5803, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 2167.5642, "rew_std": 970.3827, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 2329.2001, "rew_std": 925.7716, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 2427.4703, "rew_std": 935.2074, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 2202.2032, "rew_std": 889.7977, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 2318.2378, "rew_std": 925.6013, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 2370.0184, "rew_std": 909.7784, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 2318.9332, "rew_std": 857.8738, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 2498.729, "rew_std": 1018.3086, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 2402.2547, "rew_std": 1004.0242, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 2377.708, "rew_std": 859.3971, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 2228.2407, "rew_std": 908.7501, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 2276.0725, "rew_std": 974.3989, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 2171.0538, "rew_std": 915.2567, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 2293.7268, "rew_std": 840.503, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 2309.3953, "rew_std": 834.8744, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 2227.8159, "rew_std": 818.4304, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 2252.5822, "rew_std": 853.2035, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 2144.7569, "rew_std": 821.6433, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 2547.3423, "rew_std": 945.7498, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 2455.6882, "rew_std": 792.5609, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 2559.1104, "rew_std": 790.6916, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 2393.9441, "rew_std": 823.6406, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 2534.2962, "rew_std": 815.4712, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 2626.6735, "rew_std": 778.8513, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 2501.3082, "rew_std": 834.2012, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 2461.2728, "rew_std": 947.3733, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 2520.141, "rew_std": 729.8857, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 2529.6456, "rew_std": 769.5603, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 2453.7476, "rew_std": 923.7766, "Agent": "TRPO"}, {"env_step": 0, "rew": 17.3274, "rew_std": 3.1882, "Agent": "A2C"}, {"env_step": 30000, "rew": 462.4966, "rew_std": 346.8055, "Agent": "A2C"}, {"env_step": 60000, "rew": 622.0757, "rew_std": 308.1571, "Agent": "A2C"}, {"env_step": 90000, "rew": 682.6425, "rew_std": 293.7176, "Agent": "A2C"}, {"env_step": 120000, "rew": 626.6831, "rew_std": 267.0181, "Agent": "A2C"}, {"env_step": 150000, "rew": 588.8864, "rew_std": 272.5663, "Agent": "A2C"}, {"env_step": 180000, "rew": 570.3548, "rew_std": 273.4997, "Agent": "A2C"}, {"env_step": 210000, "rew": 583.2997, "rew_std": 269.3662, "Agent": "A2C"}, {"env_step": 240000, "rew": 568.1374, "rew_std": 285.7505, "Agent": "A2C"}, {"env_step": 270000, "rew": 600.4265, "rew_std": 283.2298, "Agent": "A2C"}, {"env_step": 300000, "rew": 581.2122, "rew_std": 281.8224, "Agent": "A2C"}, {"env_step": 330000, "rew": 582.0573, "rew_std": 275.9559, "Agent": "A2C"}, {"env_step": 360000, "rew": 639.7437, "rew_std": 248.9154, "Agent": "A2C"}, {"env_step": 390000, "rew": 748.2057, "rew_std": 324.7842, "Agent": "A2C"}, {"env_step": 420000, "rew": 826.1403, "rew_std": 476.4329, "Agent": "A2C"}, {"env_step": 450000, "rew": 772.2532, "rew_std": 355.8575, "Agent": "A2C"}, {"env_step": 480000, "rew": 729.2479, "rew_std": 296.4466, "Agent": "A2C"}, {"env_step": 510000, "rew": 819.3713, "rew_std": 456.3531, "Agent": "A2C"}, {"env_step": 540000, "rew": 709.3754, "rew_std": 292.8698, "Agent": "A2C"}, {"env_step": 570000, "rew": 732.1387, "rew_std": 328.7899, "Agent": "A2C"}, {"env_step": 600000, "rew": 990.2754, "rew_std": 488.759, "Agent": "A2C"}, {"env_step": 630000, "rew": 982.0049, "rew_std": 340.0413, "Agent": "A2C"}, {"env_step": 660000, "rew": 940.6046, "rew_std": 400.8275, "Agent": "A2C"}, {"env_step": 690000, "rew": 951.6317, "rew_std": 224.9542, "Agent": "A2C"}, {"env_step": 720000, "rew": 1166.5681, "rew_std": 264.526, "Agent": "A2C"}, {"env_step": 750000, "rew": 1253.1615, "rew_std": 458.0398, "Agent": "A2C"}, {"env_step": 780000, "rew": 1106.3958, "rew_std": 266.184, "Agent": "A2C"}, {"env_step": 810000, "rew": 1037.3397, "rew_std": 192.7324, "Agent": "A2C"}, {"env_step": 840000, "rew": 1194.818, "rew_std": 557.2156, "Agent": "A2C"}, {"env_step": 870000, "rew": 1174.3561, "rew_std": 222.2454, "Agent": "A2C"}, {"env_step": 900000, "rew": 1212.1007, "rew_std": 340.1215, "Agent": "A2C"}, {"env_step": 930000, "rew": 1132.2114, "rew_std": 514.8548, "Agent": "A2C"}, {"env_step": 960000, "rew": 1201.6032, "rew_std": 580.1104, "Agent": "A2C"}, {"env_step": 990000, "rew": 1223.54, "rew_std": 339.8763, "Agent": "A2C"}, {"env_step": 1020000, "rew": 954.8797, "rew_std": 314.4283, "Agent": "A2C"}, {"env_step": 1050000, "rew": 1160.6148, "rew_std": 429.8111, "Agent": "A2C"}, {"env_step": 1080000, "rew": 1034.2824, "rew_std": 408.4905, "Agent": "A2C"}, {"env_step": 1110000, "rew": 990.1428, "rew_std": 453.6877, "Agent": "A2C"}, {"env_step": 1140000, "rew": 1146.8304, "rew_std": 373.1246, "Agent": "A2C"}, {"env_step": 1170000, "rew": 1197.3747, "rew_std": 623.5087, "Agent": "A2C"}, {"env_step": 1200000, "rew": 1165.3104, "rew_std": 555.5445, "Agent": "A2C"}, {"env_step": 1230000, "rew": 1368.01, "rew_std": 586.2133, "Agent": "A2C"}, {"env_step": 1260000, "rew": 1345.0412, "rew_std": 559.5705, "Agent": "A2C"}, {"env_step": 1290000, "rew": 1175.3513, "rew_std": 607.5811, "Agent": "A2C"}, {"env_step": 1320000, "rew": 1094.7432, "rew_std": 688.7237, "Agent": "A2C"}, {"env_step": 1350000, "rew": 1296.5528, "rew_std": 737.2834, "Agent": "A2C"}, {"env_step": 1380000, "rew": 1088.8646, "rew_std": 336.7799, "Agent": "A2C"}, {"env_step": 1410000, "rew": 1354.1653, "rew_std": 371.5432, "Agent": "A2C"}, {"env_step": 1440000, "rew": 1275.0429, "rew_std": 374.1279, "Agent": "A2C"}, {"env_step": 1470000, "rew": 1553.9737, "rew_std": 726.4136, "Agent": "A2C"}, {"env_step": 1500000, "rew": 1348.2717, "rew_std": 537.4082, "Agent": "A2C"}, {"env_step": 1530000, "rew": 1196.8302, "rew_std": 579.4114, "Agent": "A2C"}, {"env_step": 1560000, "rew": 1301.034, "rew_std": 435.1382, "Agent": "A2C"}, {"env_step": 1590000, "rew": 1381.2474, "rew_std": 586.198, "Agent": "A2C"}, {"env_step": 1620000, "rew": 1210.7781, "rew_std": 452.1103, "Agent": "A2C"}, {"env_step": 1650000, "rew": 1159.8688, "rew_std": 308.3852, "Agent": "A2C"}, {"env_step": 1680000, "rew": 1233.043, "rew_std": 448.2399, "Agent": "A2C"}, {"env_step": 1710000, "rew": 1413.6957, "rew_std": 452.6843, "Agent": "A2C"}, {"env_step": 1740000, "rew": 1427.6175, "rew_std": 536.558, "Agent": "A2C"}, {"env_step": 1770000, "rew": 1435.2136, "rew_std": 702.4925, "Agent": "A2C"}, {"env_step": 1800000, "rew": 1517.1957, "rew_std": 570.5674, "Agent": "A2C"}, {"env_step": 1830000, "rew": 1091.752, "rew_std": 361.7346, "Agent": "A2C"}, {"env_step": 1860000, "rew": 1199.0044, "rew_std": 400.4895, "Agent": "A2C"}, {"env_step": 1890000, "rew": 1292.4859, "rew_std": 560.0479, "Agent": "A2C"}, {"env_step": 1920000, "rew": 1419.6097, "rew_std": 639.8421, "Agent": "A2C"}, {"env_step": 1950000, "rew": 1415.1152, "rew_std": 413.4579, "Agent": "A2C"}, {"env_step": 1980000, "rew": 1176.76, "rew_std": 481.8063, "Agent": "A2C"}, {"env_step": 2010000, "rew": 1294.9907, "rew_std": 429.3094, "Agent": "A2C"}, {"env_step": 2040000, "rew": 1456.2192, "rew_std": 462.3628, "Agent": "A2C"}, {"env_step": 2070000, "rew": 1608.6202, "rew_std": 529.515, "Agent": "A2C"}, {"env_step": 2100000, "rew": 1526.9954, "rew_std": 652.4756, "Agent": "A2C"}, {"env_step": 2130000, "rew": 1505.7459, "rew_std": 656.8452, "Agent": "A2C"}, {"env_step": 2160000, "rew": 1504.5428, "rew_std": 594.6738, "Agent": "A2C"}, {"env_step": 2190000, "rew": 1457.4778, "rew_std": 556.3529, "Agent": "A2C"}, {"env_step": 2220000, "rew": 1376.9743, "rew_std": 396.4713, "Agent": "A2C"}, {"env_step": 2250000, "rew": 1314.4171, "rew_std": 455.926, "Agent": "A2C"}, {"env_step": 2280000, "rew": 1181.3131, "rew_std": 421.3108, "Agent": "A2C"}, {"env_step": 2310000, "rew": 1327.9512, "rew_std": 548.2671, "Agent": "A2C"}, {"env_step": 2340000, "rew": 1214.5111, "rew_std": 312.23, "Agent": "A2C"}, {"env_step": 2370000, "rew": 1340.6044, "rew_std": 368.7874, "Agent": "A2C"}, {"env_step": 2400000, "rew": 1381.3645, "rew_std": 377.5288, "Agent": "A2C"}, {"env_step": 2430000, "rew": 1409.8832, "rew_std": 362.9671, "Agent": "A2C"}, {"env_step": 2460000, "rew": 1313.9969, "rew_std": 244.2689, "Agent": "A2C"}, {"env_step": 2490000, "rew": 1276.3597, "rew_std": 417.0242, "Agent": "A2C"}, {"env_step": 2520000, "rew": 1349.8452, "rew_std": 397.339, "Agent": "A2C"}, {"env_step": 2550000, "rew": 1257.4598, "rew_std": 450.0145, "Agent": "A2C"}, {"env_step": 2580000, "rew": 1514.8774, "rew_std": 458.0025, "Agent": "A2C"}, {"env_step": 2610000, "rew": 1338.5812, "rew_std": 343.2712, "Agent": "A2C"}, {"env_step": 2640000, "rew": 1441.4321, "rew_std": 484.9153, "Agent": "A2C"}, {"env_step": 2670000, "rew": 1430.9547, "rew_std": 335.1838, "Agent": "A2C"}, {"env_step": 2700000, "rew": 1270.3224, "rew_std": 239.8125, "Agent": "A2C"}, {"env_step": 2730000, "rew": 1402.5757, "rew_std": 358.1328, "Agent": "A2C"}, {"env_step": 2760000, "rew": 1359.1978, "rew_std": 284.1278, "Agent": "A2C"}, {"env_step": 2790000, "rew": 1311.6115, "rew_std": 235.8307, "Agent": "A2C"}, {"env_step": 2820000, "rew": 1402.1925, "rew_std": 478.4434, "Agent": "A2C"}, {"env_step": 2850000, "rew": 1220.61, "rew_std": 366.7868, "Agent": "A2C"}, {"env_step": 2880000, "rew": 1300.8353, "rew_std": 249.6865, "Agent": "A2C"}, {"env_step": 2910000, "rew": 1404.9237, "rew_std": 394.3524, "Agent": "A2C"}, {"env_step": 2940000, "rew": 1429.0835, "rew_std": 425.5458, "Agent": "A2C"}, {"env_step": 2970000, "rew": 1367.0696, "rew_std": 392.2221, "Agent": "A2C"}, {"env_step": 3000000, "rew": 1291.0612, "rew_std": 336.8317, "Agent": "A2C"}, {"env_step": 0, "rew": 17.5422, "rew_std": 3.2776, "Agent": "ACKTR"}, {"env_step": 30000, "rew": 304.9249, "rew_std": 242.2893, "Agent": "ACKTR"}, {"env_step": 60000, "rew": 219.8068, "rew_std": 56.6026, "Agent": "ACKTR"}, {"env_step": 90000, "rew": 325.8134, "rew_std": 219.4743, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 281.1752, "rew_std": 87.1774, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 327.7652, "rew_std": 84.6139, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 318.4706, "rew_std": 88.2207, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 359.4809, "rew_std": 111.4081, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 439.4241, "rew_std": 203.7932, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 374.2698, "rew_std": 146.1785, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 492.5018, "rew_std": 298.474, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 464.1214, "rew_std": 191.1444, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 398.3017, "rew_std": 107.0735, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 401.9124, "rew_std": 169.0182, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 559.9767, "rew_std": 248.8336, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 617.8844, "rew_std": 283.9486, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 470.0433, "rew_std": 181.079, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 512.0529, "rew_std": 211.3653, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 544.2903, "rew_std": 184.5096, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 558.5919, "rew_std": 212.7858, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 637.0841, "rew_std": 251.736, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 532.4362, "rew_std": 212.8007, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 601.899, "rew_std": 249.1718, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 656.795, "rew_std": 438.6089, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 584.1855, "rew_std": 352.1998, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 532.7445, "rew_std": 285.4761, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 645.1858, "rew_std": 274.1018, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 568.0694, "rew_std": 240.8376, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 592.9572, "rew_std": 400.0159, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 489.0758, "rew_std": 261.1999, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 678.0208, "rew_std": 374.4668, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 1066.1738, "rew_std": 799.7624, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 846.759, "rew_std": 522.8762, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 787.4983, "rew_std": 620.7952, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 843.901, "rew_std": 606.0721, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 920.9396, "rew_std": 629.8945, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 863.5142, "rew_std": 739.5084, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 921.0193, "rew_std": 851.6734, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 793.6159, "rew_std": 607.1138, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 862.2104, "rew_std": 596.6593, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 838.3989, "rew_std": 546.188, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 821.6949, "rew_std": 502.8031, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 831.06, "rew_std": 511.9782, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 795.1134, "rew_std": 556.4464, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 802.5034, "rew_std": 451.6817, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 1085.6525, "rew_std": 779.2799, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 792.3995, "rew_std": 355.5349, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 961.2071, "rew_std": 507.2608, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 1114.052, "rew_std": 597.0814, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 1087.158, "rew_std": 614.7536, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 1099.9079, "rew_std": 799.1687, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 952.7763, "rew_std": 530.1096, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 1046.1663, "rew_std": 628.3332, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 1131.3974, "rew_std": 590.9852, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 916.6858, "rew_std": 460.0814, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 1018.0943, "rew_std": 522.5525, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 1123.9108, "rew_std": 486.0627, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 1183.1119, "rew_std": 547.4969, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 1124.432, "rew_std": 646.2154, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 888.0863, "rew_std": 291.3664, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 1053.5495, "rew_std": 468.3159, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 1077.3572, "rew_std": 482.3279, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 903.0388, "rew_std": 450.3206, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 1122.1908, "rew_std": 471.0813, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 1127.8137, "rew_std": 453.882, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 1239.5631, "rew_std": 448.9448, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 1193.7868, "rew_std": 381.9751, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 1165.3051, "rew_std": 538.7137, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 1321.9527, "rew_std": 571.1979, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 1531.22, "rew_std": 540.5889, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 1267.6756, "rew_std": 593.4102, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 1277.196, "rew_std": 604.2548, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 1335.8426, "rew_std": 450.2048, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 1269.1418, "rew_std": 464.4829, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 1379.5432, "rew_std": 428.9311, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 1373.0315, "rew_std": 594.7235, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 1565.7903, "rew_std": 762.8894, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 1490.7087, "rew_std": 325.904, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 1424.1998, "rew_std": 519.6324, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 1369.4744, "rew_std": 599.6785, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 1660.7295, "rew_std": 576.8576, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 1271.6249, "rew_std": 606.0866, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 1450.637, "rew_std": 397.4456, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 1289.9877, "rew_std": 487.899, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 1354.3393, "rew_std": 558.5818, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 1508.2282, "rew_std": 630.2843, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 1474.4799, "rew_std": 436.6433, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 1236.7119, "rew_std": 646.8339, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 1378.7648, "rew_std": 596.5196, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 1462.9911, "rew_std": 359.6089, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 1430.8475, "rew_std": 512.0464, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 1734.0183, "rew_std": 695.4843, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 1394.0167, "rew_std": 538.651, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 1632.9884, "rew_std": 599.2205, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 1547.5347, "rew_std": 587.5889, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 1531.6114, "rew_std": 462.1249, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 1401.6916, "rew_std": 554.143, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 1596.259, "rew_std": 589.2523, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 1924.3603, "rew_std": 704.9036, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 1840.9154, "rew_std": 604.4897, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 1677.4226, "rew_std": 555.5077, "Agent": "ACKTR"}, {"env_step": 0, "rew": 47.4556, "rew_std": 36.0937, "Agent": "DDPG"}, {"env_step": 5000, "rew": 199.5964, "rew_std": 33.9794, "Agent": "DDPG"}, {"env_step": 10000, "rew": 292.9478, "rew_std": 123.7966, "Agent": "DDPG"}, {"env_step": 15000, "rew": 304.7492, "rew_std": 86.323, "Agent": "DDPG"}, {"env_step": 20000, "rew": 287.3028, "rew_std": 154.7323, "Agent": "DDPG"}, {"env_step": 25000, "rew": 350.8284, "rew_std": 185.3053, "Agent": "DDPG"}, {"env_step": 30000, "rew": 461.0749, "rew_std": 327.0808, "Agent": "DDPG"}, {"env_step": 35000, "rew": 554.0079, "rew_std": 580.9794, "Agent": "DDPG"}, {"env_step": 40000, "rew": 368.9768, "rew_std": 260.8433, "Agent": "DDPG"}, {"env_step": 45000, "rew": 424.1908, "rew_std": 156.5163, "Agent": "DDPG"}, {"env_step": 50000, "rew": 576.619, "rew_std": 305.5415, "Agent": "DDPG"}, {"env_step": 55000, "rew": 491.5706, "rew_std": 285.2554, "Agent": "DDPG"}, {"env_step": 60000, "rew": 395.1139, "rew_std": 248.961, "Agent": "DDPG"}, {"env_step": 65000, "rew": 619.7068, "rew_std": 397.6176, "Agent": "DDPG"}, {"env_step": 70000, "rew": 507.9061, "rew_std": 321.1003, "Agent": "DDPG"}, {"env_step": 75000, "rew": 719.1054, "rew_std": 406.2997, "Agent": "DDPG"}, {"env_step": 80000, "rew": 744.2296, "rew_std": 364.8092, "Agent": "DDPG"}, {"env_step": 85000, "rew": 938.9236, "rew_std": 221.6865, "Agent": "DDPG"}, {"env_step": 90000, "rew": 856.0042, "rew_std": 388.8057, "Agent": "DDPG"}, {"env_step": 95000, "rew": 573.1303, "rew_std": 437.724, "Agent": "DDPG"}, {"env_step": 100000, "rew": 904.4764, "rew_std": 396.2616, "Agent": "DDPG"}, {"env_step": 105000, "rew": 994.7385, "rew_std": 525.0778, "Agent": "DDPG"}, {"env_step": 110000, "rew": 912.3102, "rew_std": 234.5438, "Agent": "DDPG"}, {"env_step": 115000, "rew": 905.7738, "rew_std": 506.0842, "Agent": "DDPG"}, {"env_step": 120000, "rew": 1022.8284, "rew_std": 425.9909, "Agent": "DDPG"}, {"env_step": 125000, "rew": 818.86, "rew_std": 332.6216, "Agent": "DDPG"}, {"env_step": 130000, "rew": 856.2068, "rew_std": 696.1068, "Agent": "DDPG"}, {"env_step": 135000, "rew": 969.3492, "rew_std": 564.7443, "Agent": "DDPG"}, {"env_step": 140000, "rew": 935.8756, "rew_std": 502.7124, "Agent": "DDPG"}, {"env_step": 145000, "rew": 1209.4538, "rew_std": 762.8217, "Agent": "DDPG"}, {"env_step": 150000, "rew": 1071.5299, "rew_std": 668.4726, "Agent": "DDPG"}, {"env_step": 155000, "rew": 1025.5543, "rew_std": 595.0783, "Agent": "DDPG"}, {"env_step": 160000, "rew": 1552.6187, "rew_std": 729.4655, "Agent": "DDPG"}, {"env_step": 165000, "rew": 1143.5506, "rew_std": 769.8467, "Agent": "DDPG"}, {"env_step": 170000, "rew": 1202.557, "rew_std": 625.1311, "Agent": "DDPG"}, {"env_step": 175000, "rew": 1157.8752, "rew_std": 774.7858, "Agent": "DDPG"}, {"env_step": 180000, "rew": 1112.9275, "rew_std": 571.9906, "Agent": "DDPG"}, {"env_step": 185000, "rew": 1294.5619, "rew_std": 751.9106, "Agent": "DDPG"}, {"env_step": 190000, "rew": 1276.959, "rew_std": 616.8828, "Agent": "DDPG"}, {"env_step": 195000, "rew": 1152.8641, "rew_std": 936.5329, "Agent": "DDPG"}, {"env_step": 200000, "rew": 1271.7593, "rew_std": 662.8393, "Agent": "DDPG"}, {"env_step": 205000, "rew": 1386.9656, "rew_std": 864.4552, "Agent": "DDPG"}, {"env_step": 210000, "rew": 1615.4658, "rew_std": 1087.9647, "Agent": "DDPG"}, {"env_step": 215000, "rew": 1485.9, "rew_std": 901.0807, "Agent": "DDPG"}, {"env_step": 220000, "rew": 1233.074, "rew_std": 891.3348, "Agent": "DDPG"}, {"env_step": 225000, "rew": 1495.7882, "rew_std": 599.9693, "Agent": "DDPG"}, {"env_step": 230000, "rew": 1511.5256, "rew_std": 826.3847, "Agent": "DDPG"}, {"env_step": 235000, "rew": 1368.9508, "rew_std": 672.3022, "Agent": "DDPG"}, {"env_step": 240000, "rew": 2055.3458, "rew_std": 796.3992, "Agent": "DDPG"}, {"env_step": 245000, "rew": 1784.053, "rew_std": 868.0014, "Agent": "DDPG"}, {"env_step": 250000, "rew": 1188.9104, "rew_std": 528.9923, "Agent": "DDPG"}, {"env_step": 255000, "rew": 1593.2322, "rew_std": 738.7044, "Agent": "DDPG"}, {"env_step": 260000, "rew": 1558.0799, "rew_std": 565.0878, "Agent": "DDPG"}, {"env_step": 265000, "rew": 1557.7178, "rew_std": 927.1087, "Agent": "DDPG"}, {"env_step": 270000, "rew": 1335.5645, "rew_std": 908.6661, "Agent": "DDPG"}, {"env_step": 275000, "rew": 1699.6929, "rew_std": 745.9329, "Agent": "DDPG"}, {"env_step": 280000, "rew": 1582.9738, "rew_std": 712.9094, "Agent": "DDPG"}, {"env_step": 285000, "rew": 1309.9093, "rew_std": 789.7158, "Agent": "DDPG"}, {"env_step": 290000, "rew": 1612.4216, "rew_std": 907.3729, "Agent": "DDPG"}, {"env_step": 295000, "rew": 1379.8448, "rew_std": 837.7913, "Agent": "DDPG"}, {"env_step": 300000, "rew": 1240.8142, "rew_std": 792.2656, "Agent": "DDPG"}, {"env_step": 305000, "rew": 1603.6851, "rew_std": 788.9357, "Agent": "DDPG"}, {"env_step": 310000, "rew": 1678.6352, "rew_std": 738.9559, "Agent": "DDPG"}, {"env_step": 315000, "rew": 1520.7429, "rew_std": 739.0202, "Agent": "DDPG"}, {"env_step": 320000, "rew": 1341.5378, "rew_std": 811.6886, "Agent": "DDPG"}, {"env_step": 325000, "rew": 1538.3204, "rew_std": 753.9931, "Agent": "DDPG"}, {"env_step": 330000, "rew": 2171.3508, "rew_std": 812.4793, "Agent": "DDPG"}, {"env_step": 335000, "rew": 1597.8247, "rew_std": 504.1572, "Agent": "DDPG"}, {"env_step": 340000, "rew": 1502.7578, "rew_std": 706.8602, "Agent": "DDPG"}, {"env_step": 345000, "rew": 1228.9521, "rew_std": 731.932, "Agent": "DDPG"}, {"env_step": 350000, "rew": 2105.4206, "rew_std": 711.0904, "Agent": "DDPG"}, {"env_step": 355000, "rew": 1222.946, "rew_std": 719.3598, "Agent": "DDPG"}, {"env_step": 360000, "rew": 1446.9002, "rew_std": 874.4786, "Agent": "DDPG"}, {"env_step": 365000, "rew": 1501.5562, "rew_std": 814.7934, "Agent": "DDPG"}, {"env_step": 370000, "rew": 1540.5308, "rew_std": 832.5853, "Agent": "DDPG"}, {"env_step": 375000, "rew": 1618.1915, "rew_std": 985.3355, "Agent": "DDPG"}, {"env_step": 380000, "rew": 1882.0891, "rew_std": 1091.0448, "Agent": "DDPG"}, {"env_step": 385000, "rew": 1645.4651, "rew_std": 735.7729, "Agent": "DDPG"}, {"env_step": 390000, "rew": 1178.6635, "rew_std": 621.3323, "Agent": "DDPG"}, {"env_step": 395000, "rew": 1994.3664, "rew_std": 772.0565, "Agent": "DDPG"}, {"env_step": 400000, "rew": 1854.5865, "rew_std": 891.3537, "Agent": "DDPG"}, {"env_step": 405000, "rew": 1764.6518, "rew_std": 1036.0291, "Agent": "DDPG"}, {"env_step": 410000, "rew": 1484.1159, "rew_std": 1081.0145, "Agent": "DDPG"}, {"env_step": 415000, "rew": 1507.5379, "rew_std": 723.7435, "Agent": "DDPG"}, {"env_step": 420000, "rew": 1282.4193, "rew_std": 759.1662, "Agent": "DDPG"}, {"env_step": 425000, "rew": 1566.2592, "rew_std": 890.281, "Agent": "DDPG"}, {"env_step": 430000, "rew": 1611.8748, "rew_std": 737.8685, "Agent": "DDPG"}, {"env_step": 435000, "rew": 1932.6178, "rew_std": 878.2189, "Agent": "DDPG"}, {"env_step": 440000, "rew": 1861.9749, "rew_std": 712.5401, "Agent": "DDPG"}, {"env_step": 445000, "rew": 1330.4312, "rew_std": 926.2519, "Agent": "DDPG"}, {"env_step": 450000, "rew": 1279.7114, "rew_std": 749.0, "Agent": "DDPG"}, {"env_step": 455000, "rew": 1406.3635, "rew_std": 557.1778, "Agent": "DDPG"}, {"env_step": 460000, "rew": 1813.8324, "rew_std": 788.8594, "Agent": "DDPG"}, {"env_step": 465000, "rew": 1884.2437, "rew_std": 853.1452, "Agent": "DDPG"}, {"env_step": 470000, "rew": 1915.2181, "rew_std": 834.8238, "Agent": "DDPG"}, {"env_step": 475000, "rew": 1080.747, "rew_std": 451.6704, "Agent": "DDPG"}, {"env_step": 480000, "rew": 1358.944, "rew_std": 755.2171, "Agent": "DDPG"}, {"env_step": 485000, "rew": 1161.3047, "rew_std": 466.7425, "Agent": "DDPG"}, {"env_step": 490000, "rew": 1265.8359, "rew_std": 575.7276, "Agent": "DDPG"}, {"env_step": 495000, "rew": 1579.7615, "rew_std": 829.9376, "Agent": "DDPG"}, {"env_step": 500000, "rew": 1937.8091, "rew_std": 749.3357, "Agent": "DDPG"}, {"env_step": 505000, "rew": 1455.1521, "rew_std": 672.3839, "Agent": "DDPG"}, {"env_step": 510000, "rew": 1539.8811, "rew_std": 807.9035, "Agent": "DDPG"}, {"env_step": 515000, "rew": 1667.0292, "rew_std": 1080.7372, "Agent": "DDPG"}, {"env_step": 520000, "rew": 1385.8087, "rew_std": 667.4235, "Agent": "DDPG"}, {"env_step": 525000, "rew": 1362.2604, "rew_std": 915.962, "Agent": "DDPG"}, {"env_step": 530000, "rew": 1858.4627, "rew_std": 1012.5408, "Agent": "DDPG"}, {"env_step": 535000, "rew": 1726.7965, "rew_std": 628.7272, "Agent": "DDPG"}, {"env_step": 540000, "rew": 1776.6725, "rew_std": 898.7636, "Agent": "DDPG"}, {"env_step": 545000, "rew": 1613.2686, "rew_std": 1021.7273, "Agent": "DDPG"}, {"env_step": 550000, "rew": 1372.588, "rew_std": 647.6357, "Agent": "DDPG"}, {"env_step": 555000, "rew": 1666.3868, "rew_std": 821.096, "Agent": "DDPG"}, {"env_step": 560000, "rew": 1207.9626, "rew_std": 684.4657, "Agent": "DDPG"}, {"env_step": 565000, "rew": 1491.7214, "rew_std": 810.4517, "Agent": "DDPG"}, {"env_step": 570000, "rew": 1517.6948, "rew_std": 562.8144, "Agent": "DDPG"}, {"env_step": 575000, "rew": 1419.4688, "rew_std": 634.5265, "Agent": "DDPG"}, {"env_step": 580000, "rew": 1233.782, "rew_std": 695.0035, "Agent": "DDPG"}, {"env_step": 585000, "rew": 1836.1308, "rew_std": 780.2811, "Agent": "DDPG"}, {"env_step": 590000, "rew": 2012.6321, "rew_std": 710.0638, "Agent": "DDPG"}, {"env_step": 595000, "rew": 1827.9922, "rew_std": 844.7668, "Agent": "DDPG"}, {"env_step": 600000, "rew": 1491.2336, "rew_std": 478.5381, "Agent": "DDPG"}, {"env_step": 605000, "rew": 1661.3061, "rew_std": 741.2274, "Agent": "DDPG"}, {"env_step": 610000, "rew": 1913.0473, "rew_std": 901.0005, "Agent": "DDPG"}, {"env_step": 615000, "rew": 1491.7244, "rew_std": 603.3158, "Agent": "DDPG"}, {"env_step": 620000, "rew": 2054.5905, "rew_std": 727.9373, "Agent": "DDPG"}, {"env_step": 625000, "rew": 1717.238, "rew_std": 949.1291, "Agent": "DDPG"}, {"env_step": 630000, "rew": 1453.1425, "rew_std": 734.2967, "Agent": "DDPG"}, {"env_step": 635000, "rew": 1917.0793, "rew_std": 920.3567, "Agent": "DDPG"}, {"env_step": 640000, "rew": 1816.6305, "rew_std": 562.8137, "Agent": "DDPG"}, {"env_step": 645000, "rew": 1350.5139, "rew_std": 762.7955, "Agent": "DDPG"}, {"env_step": 650000, "rew": 1562.9627, "rew_std": 610.504, "Agent": "DDPG"}, {"env_step": 655000, "rew": 1683.4779, "rew_std": 811.7958, "Agent": "DDPG"}, {"env_step": 660000, "rew": 1948.6147, "rew_std": 780.7959, "Agent": "DDPG"}, {"env_step": 665000, "rew": 1502.015, "rew_std": 778.1516, "Agent": "DDPG"}, {"env_step": 670000, "rew": 1888.6714, "rew_std": 890.6181, "Agent": "DDPG"}, {"env_step": 675000, "rew": 1331.4954, "rew_std": 903.252, "Agent": "DDPG"}, {"env_step": 680000, "rew": 1374.4944, "rew_std": 651.6485, "Agent": "DDPG"}, {"env_step": 685000, "rew": 1658.4132, "rew_std": 606.6067, "Agent": "DDPG"}, {"env_step": 690000, "rew": 1834.4839, "rew_std": 835.1019, "Agent": "DDPG"}, {"env_step": 695000, "rew": 1207.13, "rew_std": 629.4921, "Agent": "DDPG"}, {"env_step": 700000, "rew": 1479.8799, "rew_std": 774.4921, "Agent": "DDPG"}, {"env_step": 705000, "rew": 1430.1922, "rew_std": 790.7581, "Agent": "DDPG"}, {"env_step": 710000, "rew": 1148.2108, "rew_std": 469.6791, "Agent": "DDPG"}, {"env_step": 715000, "rew": 1234.3927, "rew_std": 616.3696, "Agent": "DDPG"}, {"env_step": 720000, "rew": 1442.2469, "rew_std": 869.6578, "Agent": "DDPG"}, {"env_step": 725000, "rew": 2047.1622, "rew_std": 997.6007, "Agent": "DDPG"}, {"env_step": 730000, "rew": 1791.2108, "rew_std": 944.3568, "Agent": "DDPG"}, {"env_step": 735000, "rew": 1337.5849, "rew_std": 715.2636, "Agent": "DDPG"}, {"env_step": 740000, "rew": 1440.0945, "rew_std": 375.8207, "Agent": "DDPG"}, {"env_step": 745000, "rew": 1146.3608, "rew_std": 815.5818, "Agent": "DDPG"}, {"env_step": 750000, "rew": 1407.0721, "rew_std": 537.2618, "Agent": "DDPG"}, {"env_step": 755000, "rew": 1880.9328, "rew_std": 1002.6757, "Agent": "DDPG"}, {"env_step": 760000, "rew": 1888.895, "rew_std": 661.2671, "Agent": "DDPG"}, {"env_step": 765000, "rew": 1888.1488, "rew_std": 760.2352, "Agent": "DDPG"}, {"env_step": 770000, "rew": 1648.2798, "rew_std": 780.4931, "Agent": "DDPG"}, {"env_step": 775000, "rew": 1660.9453, "rew_std": 603.4395, "Agent": "DDPG"}, {"env_step": 780000, "rew": 1766.914, "rew_std": 568.0854, "Agent": "DDPG"}, {"env_step": 785000, "rew": 1934.2981, "rew_std": 719.8906, "Agent": "DDPG"}, {"env_step": 790000, "rew": 1251.4397, "rew_std": 638.1787, "Agent": "DDPG"}, {"env_step": 795000, "rew": 1449.0066, "rew_std": 795.1345, "Agent": "DDPG"}, {"env_step": 800000, "rew": 1954.0406, "rew_std": 828.3001, "Agent": "DDPG"}, {"env_step": 805000, "rew": 1768.7785, "rew_std": 858.3872, "Agent": "DDPG"}, {"env_step": 810000, "rew": 2027.9814, "rew_std": 839.1931, "Agent": "DDPG"}, {"env_step": 815000, "rew": 1913.2213, "rew_std": 692.3181, "Agent": "DDPG"}, {"env_step": 820000, "rew": 1599.5942, "rew_std": 844.4248, "Agent": "DDPG"}, {"env_step": 825000, "rew": 1648.2999, "rew_std": 848.1727, "Agent": "DDPG"}, {"env_step": 830000, "rew": 1672.2677, "rew_std": 650.2616, "Agent": "DDPG"}, {"env_step": 835000, "rew": 1426.2038, "rew_std": 603.851, "Agent": "DDPG"}, {"env_step": 840000, "rew": 1201.6071, "rew_std": 713.3597, "Agent": "DDPG"}, {"env_step": 845000, "rew": 1891.6987, "rew_std": 1094.6308, "Agent": "DDPG"}, {"env_step": 850000, "rew": 1831.5032, "rew_std": 788.3598, "Agent": "DDPG"}, {"env_step": 855000, "rew": 1808.393, "rew_std": 811.0075, "Agent": "DDPG"}, {"env_step": 860000, "rew": 1722.02, "rew_std": 897.3865, "Agent": "DDPG"}, {"env_step": 865000, "rew": 1716.2164, "rew_std": 966.9749, "Agent": "DDPG"}, {"env_step": 870000, "rew": 1987.0209, "rew_std": 978.3952, "Agent": "DDPG"}, {"env_step": 875000, "rew": 1737.9764, "rew_std": 832.1536, "Agent": "DDPG"}, {"env_step": 880000, "rew": 1398.2013, "rew_std": 657.9203, "Agent": "DDPG"}, {"env_step": 885000, "rew": 1343.473, "rew_std": 754.4166, "Agent": "DDPG"}, {"env_step": 890000, "rew": 1681.7618, "rew_std": 929.122, "Agent": "DDPG"}, {"env_step": 895000, "rew": 1568.8794, "rew_std": 904.3076, "Agent": "DDPG"}, {"env_step": 900000, "rew": 1601.8665, "rew_std": 488.7929, "Agent": "DDPG"}, {"env_step": 905000, "rew": 1795.0391, "rew_std": 740.0067, "Agent": "DDPG"}, {"env_step": 910000, "rew": 1630.1091, "rew_std": 534.433, "Agent": "DDPG"}, {"env_step": 915000, "rew": 1856.3447, "rew_std": 898.0134, "Agent": "DDPG"}, {"env_step": 920000, "rew": 1773.9826, "rew_std": 892.2861, "Agent": "DDPG"}, {"env_step": 925000, "rew": 1744.7145, "rew_std": 902.0155, "Agent": "DDPG"}, {"env_step": 930000, "rew": 1681.8963, "rew_std": 934.1126, "Agent": "DDPG"}, {"env_step": 935000, "rew": 1544.4927, "rew_std": 869.2729, "Agent": "DDPG"}, {"env_step": 940000, "rew": 1710.695, "rew_std": 892.1599, "Agent": "DDPG"}, {"env_step": 945000, "rew": 1556.9009, "rew_std": 719.2425, "Agent": "DDPG"}, {"env_step": 950000, "rew": 1560.5468, "rew_std": 580.7039, "Agent": "DDPG"}, {"env_step": 955000, "rew": 1648.3686, "rew_std": 822.4474, "Agent": "DDPG"}, {"env_step": 960000, "rew": 2017.7817, "rew_std": 1049.0691, "Agent": "DDPG"}, {"env_step": 965000, "rew": 1799.2743, "rew_std": 804.7937, "Agent": "DDPG"}, {"env_step": 970000, "rew": 1431.8169, "rew_std": 811.7101, "Agent": "DDPG"}, {"env_step": 975000, "rew": 1907.9792, "rew_std": 863.3055, "Agent": "DDPG"}, {"env_step": 980000, "rew": 2151.5975, "rew_std": 920.9613, "Agent": "DDPG"}, {"env_step": 985000, "rew": 1636.355, "rew_std": 932.402, "Agent": "DDPG"}, {"env_step": 990000, "rew": 1931.229, "rew_std": 782.7125, "Agent": "DDPG"}, {"env_step": 995000, "rew": 2197.0024, "rew_std": 971.5598, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 1604.1096, "rew_std": 936.3235, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 1786.0517, "rew_std": 737.9123, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 1909.8342, "rew_std": 871.6584, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 1948.7802, "rew_std": 753.618, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 1893.587, "rew_std": 750.6465, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 1321.526, "rew_std": 862.1018, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 1479.0536, "rew_std": 825.3967, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 1893.2489, "rew_std": 857.862, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 1492.398, "rew_std": 417.7379, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 1968.4006, "rew_std": 1060.8542, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 1699.4541, "rew_std": 693.4526, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 1486.8643, "rew_std": 608.8139, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 1834.2127, "rew_std": 806.547, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 1898.1982, "rew_std": 868.8335, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 1684.3683, "rew_std": 1056.3452, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 1486.0796, "rew_std": 675.3654, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 1803.2819, "rew_std": 650.8471, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 1857.7992, "rew_std": 712.9232, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 1920.1208, "rew_std": 741.0524, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 1527.1626, "rew_std": 612.0535, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 1914.8211, "rew_std": 878.0446, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 1938.9422, "rew_std": 845.4695, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 1898.7433, "rew_std": 778.8337, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 1700.4836, "rew_std": 728.2356, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 1972.3923, "rew_std": 724.0617, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 1285.6144, "rew_std": 738.7202, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 1615.0117, "rew_std": 726.2691, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 1819.1191, "rew_std": 986.4788, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 1942.4306, "rew_std": 760.4511, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 1221.439, "rew_std": 556.0734, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 1531.2899, "rew_std": 777.4329, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 1326.1052, "rew_std": 652.3935, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 1602.6076, "rew_std": 1082.0088, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 1315.7433, "rew_std": 1057.8408, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 1335.9779, "rew_std": 861.6155, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 1171.8838, "rew_std": 994.2239, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 1324.1715, "rew_std": 500.5259, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 1494.8449, "rew_std": 781.0521, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 1789.3493, "rew_std": 1027.1175, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 1712.5583, "rew_std": 977.8344, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 1564.3719, "rew_std": 649.959, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 1433.258, "rew_std": 548.2289, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 1008.6215, "rew_std": 401.7016, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 1330.1364, "rew_std": 766.7963, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 1759.6604, "rew_std": 909.4543, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 1995.3988, "rew_std": 1042.6365, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 1585.5809, "rew_std": 919.0067, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 1708.5545, "rew_std": 1047.1052, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 1646.8702, "rew_std": 992.2616, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 1340.428, "rew_std": 824.6133, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 1353.3964, "rew_std": 823.2441, "Agent": "DDPG"}, {"env_step": 0, "rew": 17.3274, "rew_std": 3.1882, "Agent": "NPG"}, {"env_step": 30720, "rew": 203.8315, "rew_std": 14.5111, "Agent": "NPG"}, {"env_step": 61440, "rew": 237.8075, "rew_std": 9.0874, "Agent": "NPG"}, {"env_step": 92160, "rew": 291.2451, "rew_std": 30.3522, "Agent": "NPG"}, {"env_step": 122880, "rew": 337.0792, "rew_std": 18.7415, "Agent": "NPG"}, {"env_step": 153600, "rew": 375.4023, "rew_std": 32.5844, "Agent": "NPG"}, {"env_step": 184320, "rew": 401.231, "rew_std": 28.3971, "Agent": "NPG"}, {"env_step": 215040, "rew": 423.9764, "rew_std": 22.5126, "Agent": "NPG"}, {"env_step": 245760, "rew": 460.5551, "rew_std": 64.4361, "Agent": "NPG"}, {"env_step": 276480, "rew": 519.9143, "rew_std": 136.6233, "Agent": "NPG"}, {"env_step": 307200, "rew": 553.7869, "rew_std": 168.2861, "Agent": "NPG"}, {"env_step": 337920, "rew": 582.6567, "rew_std": 194.1075, "Agent": "NPG"}, {"env_step": 368640, "rew": 653.1399, "rew_std": 247.264, "Agent": "NPG"}, {"env_step": 399360, "rew": 741.5686, "rew_std": 349.6129, "Agent": "NPG"}, {"env_step": 430080, "rew": 864.2315, "rew_std": 523.9531, "Agent": "NPG"}, {"env_step": 460800, "rew": 852.3554, "rew_std": 385.2958, "Agent": "NPG"}, {"env_step": 491520, "rew": 898.2792, "rew_std": 370.3424, "Agent": "NPG"}, {"env_step": 522240, "rew": 961.7205, "rew_std": 418.1247, "Agent": "NPG"}, {"env_step": 552960, "rew": 1011.1503, "rew_std": 473.6211, "Agent": "NPG"}, {"env_step": 583680, "rew": 1122.4003, "rew_std": 592.3021, "Agent": "NPG"}, {"env_step": 614400, "rew": 1131.8884, "rew_std": 547.6223, "Agent": "NPG"}, {"env_step": 645120, "rew": 1238.1649, "rew_std": 623.5523, "Agent": "NPG"}, {"env_step": 675840, "rew": 1244.9957, "rew_std": 484.3665, "Agent": "NPG"}, {"env_step": 706560, "rew": 1372.1575, "rew_std": 579.6097, "Agent": "NPG"}, {"env_step": 737280, "rew": 1545.6328, "rew_std": 629.8417, "Agent": "NPG"}, {"env_step": 768000, "rew": 1621.7295, "rew_std": 635.7453, "Agent": "NPG"}, {"env_step": 798720, "rew": 1586.0821, "rew_std": 582.9658, "Agent": "NPG"}, {"env_step": 829440, "rew": 1655.3994, "rew_std": 718.3732, "Agent": "NPG"}, {"env_step": 860160, "rew": 1904.103, "rew_std": 625.2208, "Agent": "NPG"}, {"env_step": 890880, "rew": 1837.8605, "rew_std": 698.25, "Agent": "NPG"}, {"env_step": 921600, "rew": 1787.2493, "rew_std": 600.2013, "Agent": "NPG"}, {"env_step": 952320, "rew": 1871.2556, "rew_std": 658.4671, "Agent": "NPG"}, {"env_step": 983040, "rew": 1915.1982, "rew_std": 550.5251, "Agent": "NPG"}, {"env_step": 1013760, "rew": 1883.5395, "rew_std": 607.3368, "Agent": "NPG"}, {"env_step": 1044480, "rew": 1784.9045, "rew_std": 616.9169, "Agent": "NPG"}, {"env_step": 1075200, "rew": 1934.1622, "rew_std": 632.0287, "Agent": "NPG"}, {"env_step": 1105920, "rew": 1931.5233, "rew_std": 547.5288, "Agent": "NPG"}, {"env_step": 1136640, "rew": 1982.61, "rew_std": 693.0945, "Agent": "NPG"}, {"env_step": 1167360, "rew": 2080.1817, "rew_std": 668.4118, "Agent": "NPG"}, {"env_step": 1198080, "rew": 1956.9138, "rew_std": 558.163, "Agent": "NPG"}, {"env_step": 1228800, "rew": 2007.3187, "rew_std": 589.66, "Agent": "NPG"}, {"env_step": 1259520, "rew": 1870.5981, "rew_std": 624.8375, "Agent": "NPG"}, {"env_step": 1290240, "rew": 1996.6054, "rew_std": 564.1005, "Agent": "NPG"}, {"env_step": 1320960, "rew": 2076.7399, "rew_std": 629.456, "Agent": "NPG"}, {"env_step": 1351680, "rew": 1997.9941, "rew_std": 649.6904, "Agent": "NPG"}, {"env_step": 1382400, "rew": 2002.5351, "rew_std": 547.6064, "Agent": "NPG"}, {"env_step": 1413120, "rew": 2056.7745, "rew_std": 533.2264, "Agent": "NPG"}, {"env_step": 1443840, "rew": 1988.813, "rew_std": 507.8021, "Agent": "NPG"}, {"env_step": 1474560, "rew": 2147.6497, "rew_std": 504.7356, "Agent": "NPG"}, {"env_step": 1505280, "rew": 2079.0909, "rew_std": 578.1407, "Agent": "NPG"}, {"env_step": 1536000, "rew": 2092.4962, "rew_std": 481.8786, "Agent": "NPG"}, {"env_step": 1566720, "rew": 2149.4969, "rew_std": 580.7579, "Agent": "NPG"}, {"env_step": 1597440, "rew": 2287.9842, "rew_std": 550.017, "Agent": "NPG"}, {"env_step": 1628160, "rew": 2170.1871, "rew_std": 479.2615, "Agent": "NPG"}, {"env_step": 1658880, "rew": 2203.4247, "rew_std": 478.7142, "Agent": "NPG"}, {"env_step": 1689600, "rew": 2092.001, "rew_std": 507.9722, "Agent": "NPG"}, {"env_step": 1720320, "rew": 2189.6386, "rew_std": 558.5493, "Agent": "NPG"}, {"env_step": 1751040, "rew": 2137.6187, "rew_std": 602.4165, "Agent": "NPG"}, {"env_step": 1781760, "rew": 2232.7823, "rew_std": 634.4069, "Agent": "NPG"}, {"env_step": 1812480, "rew": 2064.7807, "rew_std": 390.5897, "Agent": "NPG"}, {"env_step": 1843200, "rew": 2187.579, "rew_std": 446.4498, "Agent": "NPG"}, {"env_step": 1873920, "rew": 2325.7036, "rew_std": 531.1478, "Agent": "NPG"}, {"env_step": 1904640, "rew": 2401.6918, "rew_std": 542.0848, "Agent": "NPG"}, {"env_step": 1935360, "rew": 2200.0264, "rew_std": 510.0376, "Agent": "NPG"}, {"env_step": 1966080, "rew": 2297.9461, "rew_std": 483.4262, "Agent": "NPG"}, {"env_step": 1996800, "rew": 2331.2133, "rew_std": 509.2854, "Agent": "NPG"}, {"env_step": 2027520, "rew": 2361.1798, "rew_std": 562.208, "Agent": "NPG"}, {"env_step": 2058240, "rew": 2370.4972, "rew_std": 482.1761, "Agent": "NPG"}, {"env_step": 2088960, "rew": 2393.7227, "rew_std": 434.0232, "Agent": "NPG"}, {"env_step": 2119680, "rew": 2276.2466, "rew_std": 564.5921, "Agent": "NPG"}, {"env_step": 2150400, "rew": 2336.9217, "rew_std": 479.7896, "Agent": "NPG"}, {"env_step": 2181120, "rew": 2381.4366, "rew_std": 546.8422, "Agent": "NPG"}, {"env_step": 2211840, "rew": 2459.0929, "rew_std": 463.9144, "Agent": "NPG"}, {"env_step": 2242560, "rew": 2459.2929, "rew_std": 560.7651, "Agent": "NPG"}, {"env_step": 2273280, "rew": 2223.1782, "rew_std": 496.8314, "Agent": "NPG"}, {"env_step": 2304000, "rew": 2375.4968, "rew_std": 426.4026, "Agent": "NPG"}, {"env_step": 2334720, "rew": 2354.7356, "rew_std": 523.9221, "Agent": "NPG"}, {"env_step": 2365440, "rew": 2148.1848, "rew_std": 410.0888, "Agent": "NPG"}, {"env_step": 2396160, "rew": 2297.2782, "rew_std": 471.3105, "Agent": "NPG"}, {"env_step": 2426880, "rew": 2341.1945, "rew_std": 413.9194, "Agent": "NPG"}, {"env_step": 2457600, "rew": 2221.5854, "rew_std": 600.439, "Agent": "NPG"}, {"env_step": 2488320, "rew": 2421.9953, "rew_std": 663.6039, "Agent": "NPG"}, {"env_step": 2519040, "rew": 2520.4968, "rew_std": 454.7562, "Agent": "NPG"}, {"env_step": 2549760, "rew": 2432.1227, "rew_std": 485.1535, "Agent": "NPG"}, {"env_step": 2580480, "rew": 2433.1222, "rew_std": 421.6446, "Agent": "NPG"}, {"env_step": 2611200, "rew": 2443.7814, "rew_std": 527.5954, "Agent": "NPG"}, {"env_step": 2641920, "rew": 2252.6428, "rew_std": 613.1488, "Agent": "NPG"}, {"env_step": 2672640, "rew": 2328.3538, "rew_std": 451.5097, "Agent": "NPG"}, {"env_step": 2703360, "rew": 2449.0935, "rew_std": 453.5471, "Agent": "NPG"}, {"env_step": 2734080, "rew": 2360.1628, "rew_std": 492.6652, "Agent": "NPG"}, {"env_step": 2764800, "rew": 2421.0624, "rew_std": 496.3625, "Agent": "NPG"}, {"env_step": 2795520, "rew": 2504.4142, "rew_std": 661.299, "Agent": "NPG"}, {"env_step": 2826240, "rew": 2520.7559, "rew_std": 527.4457, "Agent": "NPG"}, {"env_step": 2856960, "rew": 2611.0908, "rew_std": 554.4775, "Agent": "NPG"}, {"env_step": 2887680, "rew": 2453.1244, "rew_std": 586.2238, "Agent": "NPG"}, {"env_step": 2918400, "rew": 2427.2545, "rew_std": 683.8347, "Agent": "NPG"}, {"env_step": 2949120, "rew": 2417.5517, "rew_std": 594.8328, "Agent": "NPG"}, {"env_step": 2979840, "rew": 2419.6, "rew_std": 571.0616, "Agent": "NPG"}, {"env_step": 3010560, "rew": 2531.9942, "rew_std": 593.9883, "Agent": "NPG"}, {"env_step": 3041280, "rew": 2542.3326, "rew_std": 438.6771, "Agent": "NPG"}, {"env_step": 3072000, "rew": 2445.7838, "rew_std": 440.8745, "Agent": "NPG"}]