[{"env_step": 0, "rew": -45.1638, "rew_std": 26.8049, "Agent": "PPO"}, {"env_step": 30720, "rew": 1.1798, "rew_std": 7.6052, "Agent": "PPO"}, {"env_step": 61440, "rew": 108.396, "rew_std": 24.5339, "Agent": "PPO"}, {"env_step": 92160, "rew": 257.0256, "rew_std": 60.1797, "Agent": "PPO"}, {"env_step": 122880, "rew": 409.4479, "rew_std": 107.6753, "Agent": "PPO"}, {"env_step": 153600, "rew": 576.9856, "rew_std": 104.0574, "Agent": "PPO"}, {"env_step": 184320, "rew": 680.1085, "rew_std": 154.5434, "Agent": "PPO"}, {"env_step": 215040, "rew": 734.055, "rew_std": 157.4357, "Agent": "PPO"}, {"env_step": 245760, "rew": 902.7627, "rew_std": 256.8418, "Agent": "PPO"}, {"env_step": 276480, "rew": 1002.7442, "rew_std": 263.7889, "Agent": "PPO"}, {"env_step": 307200, "rew": 933.2541, "rew_std": 233.041, "Agent": "PPO"}, {"env_step": 337920, "rew": 1381.7994, "rew_std": 171.3465, "Agent": "PPO"}, {"env_step": 368640, "rew": 1365.8795, "rew_std": 265.6691, "Agent": "PPO"}, {"env_step": 399360, "rew": 1422.151, "rew_std": 355.0902, "Agent": "PPO"}, {"env_step": 430080, "rew": 1437.5237, "rew_std": 351.6675, "Agent": "PPO"}, {"env_step": 460800, "rew": 1592.5595, "rew_std": 435.5349, "Agent": "PPO"}, {"env_step": 491520, "rew": 1830.9248, "rew_std": 327.1536, "Agent": "PPO"}, {"env_step": 522240, "rew": 1865.1769, "rew_std": 617.9661, "Agent": "PPO"}, {"env_step": 552960, "rew": 2027.5555, "rew_std": 450.231, "Agent": "PPO"}, {"env_step": 583680, "rew": 1922.7912, "rew_std": 530.9554, "Agent": "PPO"}, {"env_step": 614400, "rew": 2155.52, "rew_std": 605.2654, "Agent": "PPO"}, {"env_step": 645120, "rew": 2281.4225, "rew_std": 659.161, "Agent": "PPO"}, {"env_step": 675840, "rew": 2466.7854, "rew_std": 800.2599, "Agent": "PPO"}, {"env_step": 706560, "rew": 2778.6914, "rew_std": 818.3568, "Agent": "PPO"}, {"env_step": 737280, "rew": 2408.4636, "rew_std": 658.6381, "Agent": "PPO"}, {"env_step": 768000, "rew": 2787.5943, "rew_std": 758.873, "Agent": "PPO"}, {"env_step": 798720, "rew": 2672.0722, "rew_std": 886.4375, "Agent": "PPO"}, {"env_step": 829440, "rew": 2815.8244, "rew_std": 756.2206, "Agent": "PPO"}, {"env_step": 860160, "rew": 2881.8245, "rew_std": 932.4833, "Agent": "PPO"}, {"env_step": 890880, "rew": 3054.5044, "rew_std": 656.7209, "Agent": "PPO"}, {"env_step": 921600, "rew": 2805.7394, "rew_std": 811.9402, "Agent": "PPO"}, {"env_step": 952320, "rew": 3156.5113, "rew_std": 882.0281, "Agent": "PPO"}, {"env_step": 983040, "rew": 3258.3684, "rew_std": 1079.2574, "Agent": "PPO"}, {"env_step": 1013760, "rew": 3141.0442, "rew_std": 1009.4955, "Agent": "PPO"}, {"env_step": 1044480, "rew": 3103.7708, "rew_std": 785.5033, "Agent": "PPO"}, {"env_step": 1075200, "rew": 2894.7434, "rew_std": 844.0465, "Agent": "PPO"}, {"env_step": 1105920, "rew": 3268.2543, "rew_std": 849.4982, "Agent": "PPO"}, {"env_step": 1136640, "rew": 3032.4115, "rew_std": 887.7795, "Agent": "PPO"}, {"env_step": 1167360, "rew": 2798.2882, "rew_std": 1018.4211, "Agent": "PPO"}, {"env_step": 1198080, "rew": 2982.8664, "rew_std": 1182.9198, "Agent": "PPO"}, {"env_step": 1228800, "rew": 2853.1494, "rew_std": 856.6556, "Agent": "PPO"}, {"env_step": 1259520, "rew": 3189.8264, "rew_std": 857.3083, "Agent": "PPO"}, {"env_step": 1290240, "rew": 3148.1075, "rew_std": 1157.6515, "Agent": "PPO"}, {"env_step": 1320960, "rew": 3414.5263, "rew_std": 1133.0382, "Agent": "PPO"}, {"env_step": 1351680, "rew": 3182.4456, "rew_std": 848.7621, "Agent": "PPO"}, {"env_step": 1382400, "rew": 3163.9297, "rew_std": 898.0596, "Agent": "PPO"}, {"env_step": 1413120, "rew": 3334.0317, "rew_std": 1050.2921, "Agent": "PPO"}, {"env_step": 1443840, "rew": 3112.8048, "rew_std": 1262.7364, "Agent": "PPO"}, {"env_step": 1474560, "rew": 3406.995, "rew_std": 1065.5177, "Agent": "PPO"}, {"env_step": 1505280, "rew": 3200.8696, "rew_std": 1149.5605, "Agent": "PPO"}, {"env_step": 1536000, "rew": 3336.6813, "rew_std": 867.9635, "Agent": "PPO"}, {"env_step": 1566720, "rew": 3522.898, "rew_std": 1000.9456, "Agent": "PPO"}, {"env_step": 1597440, "rew": 3435.2771, "rew_std": 967.5778, "Agent": "PPO"}, {"env_step": 1628160, "rew": 3601.9068, "rew_std": 1035.0799, "Agent": "PPO"}, {"env_step": 1658880, "rew": 3446.1252, "rew_std": 820.5245, "Agent": "PPO"}, {"env_step": 1689600, "rew": 3505.6386, "rew_std": 968.1454, "Agent": "PPO"}, {"env_step": 1720320, "rew": 3687.4512, "rew_std": 867.7069, "Agent": "PPO"}, {"env_step": 1751040, "rew": 3615.7173, "rew_std": 839.4768, "Agent": "PPO"}, {"env_step": 1781760, "rew": 3712.6804, "rew_std": 957.1922, "Agent": "PPO"}, {"env_step": 1812480, "rew": 3525.5926, "rew_std": 825.2101, "Agent": "PPO"}, {"env_step": 1843200, "rew": 3679.4306, "rew_std": 753.9294, "Agent": "PPO"}, {"env_step": 1873920, "rew": 3758.6323, "rew_std": 770.2905, "Agent": "PPO"}, {"env_step": 1904640, "rew": 3481.2124, "rew_std": 756.4533, "Agent": "PPO"}, {"env_step": 1935360, "rew": 3420.7446, "rew_std": 805.4886, "Agent": "PPO"}, {"env_step": 1966080, "rew": 3494.1347, "rew_std": 752.0038, "Agent": "PPO"}, {"env_step": 1996800, "rew": 3577.4866, "rew_std": 339.4057, "Agent": "PPO"}, {"env_step": 2027520, "rew": 3639.4031, "rew_std": 971.0206, "Agent": "PPO"}, {"env_step": 2058240, "rew": 3519.3977, "rew_std": 713.6278, "Agent": "PPO"}, {"env_step": 2088960, "rew": 3512.7617, "rew_std": 780.0977, "Agent": "PPO"}, {"env_step": 2119680, "rew": 3530.8447, "rew_std": 636.9476, "Agent": "PPO"}, {"env_step": 2150400, "rew": 3523.7627, "rew_std": 741.5985, "Agent": "PPO"}, {"env_step": 2181120, "rew": 3564.3577, "rew_std": 708.5225, "Agent": "PPO"}, {"env_step": 2211840, "rew": 3576.1605, "rew_std": 866.6277, "Agent": "PPO"}, {"env_step": 2242560, "rew": 3804.0978, "rew_std": 705.8611, "Agent": "PPO"}, {"env_step": 2273280, "rew": 3599.313, "rew_std": 699.1721, "Agent": "PPO"}, {"env_step": 2304000, "rew": 3721.4555, "rew_std": 711.6818, "Agent": "PPO"}, {"env_step": 2334720, "rew": 3532.7069, "rew_std": 837.1282, "Agent": "PPO"}, {"env_step": 2365440, "rew": 3608.8838, "rew_std": 1090.2108, "Agent": "PPO"}, {"env_step": 2396160, "rew": 3910.161, "rew_std": 678.6507, "Agent": "PPO"}, {"env_step": 2426880, "rew": 3426.0564, "rew_std": 1185.8051, "Agent": "PPO"}, {"env_step": 2457600, "rew": 3679.0407, "rew_std": 873.2651, "Agent": "PPO"}, {"env_step": 2488320, "rew": 3757.3899, "rew_std": 950.9568, "Agent": "PPO"}, {"env_step": 2519040, "rew": 3813.3742, "rew_std": 764.5632, "Agent": "PPO"}, {"env_step": 2549760, "rew": 3773.2322, "rew_std": 727.4568, "Agent": "PPO"}, {"env_step": 2580480, "rew": 3639.3853, "rew_std": 827.8082, "Agent": "PPO"}, {"env_step": 2611200, "rew": 3704.148, "rew_std": 691.7173, "Agent": "PPO"}, {"env_step": 2641920, "rew": 3798.3913, "rew_std": 694.0727, "Agent": "PPO"}, {"env_step": 2672640, "rew": 3826.2185, "rew_std": 891.9137, "Agent": "PPO"}, {"env_step": 2703360, "rew": 3965.214, "rew_std": 820.4513, "Agent": "PPO"}, {"env_step": 2734080, "rew": 3644.2885, "rew_std": 977.7322, "Agent": "PPO"}, {"env_step": 2764800, "rew": 3832.7547, "rew_std": 857.0111, "Agent": "PPO"}, {"env_step": 2795520, "rew": 3870.129, "rew_std": 816.0748, "Agent": "PPO"}, {"env_step": 2826240, "rew": 3877.0556, "rew_std": 882.7163, "Agent": "PPO"}, {"env_step": 2856960, "rew": 4003.1883, "rew_std": 676.3348, "Agent": "PPO"}, {"env_step": 2887680, "rew": 3668.3481, "rew_std": 838.448, "Agent": "PPO"}, {"env_step": 2918400, "rew": 4079.2655, "rew_std": 880.1724, "Agent": "PPO"}, {"env_step": 2949120, "rew": 3730.9786, "rew_std": 834.9895, "Agent": "PPO"}, {"env_step": 2979840, "rew": 3877.0596, "rew_std": 878.0078, "Agent": "PPO"}, {"env_step": 3010560, "rew": 3750.2836, "rew_std": 849.4658, "Agent": "PPO"}, {"env_step": 3041280, "rew": 4148.1549, "rew_std": 852.399, "Agent": "PPO"}, {"env_step": 3072000, "rew": 3803.2651, "rew_std": 890.7726, "Agent": "PPO"}, {"env_step": 5000, "rew": 873.2881, "rew_std": 38.9518, "Agent": "TD3"}, {"env_step": 10000, "rew": 692.9757, "rew_std": 120.2028, "Agent": "TD3"}, {"env_step": 15000, "rew": 397.0552, "rew_std": 128.6915, "Agent": "TD3"}, {"env_step": 20000, "rew": 480.1642, "rew_std": 153.2019, "Agent": "TD3"}, {"env_step": 25000, "rew": 400.1059, "rew_std": 117.3685, "Agent": "TD3"}, {"env_step": 30000, "rew": 327.8603, "rew_std": 112.1915, "Agent": "TD3"}, {"env_step": 35000, "rew": 423.3604, "rew_std": 110.1699, "Agent": "TD3"}, {"env_step": 40000, "rew": 550.256, "rew_std": 120.7782, "Agent": "TD3"}, {"env_step": 45000, "rew": 622.4788, "rew_std": 118.6195, "Agent": "TD3"}, {"env_step": 50000, "rew": 597.6534, "rew_std": 116.1693, "Agent": "TD3"}, {"env_step": 55000, "rew": 655.5329, "rew_std": 52.1289, "Agent": "TD3"}, {"env_step": 60000, "rew": 605.0446, "rew_std": 79.2021, "Agent": "TD3"}, {"env_step": 65000, "rew": 711.6328, "rew_std": 154.2924, "Agent": "TD3"}, {"env_step": 70000, "rew": 815.7518, "rew_std": 183.6716, "Agent": "TD3"}, {"env_step": 75000, "rew": 787.1799, "rew_std": 162.4248, "Agent": "TD3"}, {"env_step": 80000, "rew": 824.0866, "rew_std": 188.9611, "Agent": "TD3"}, {"env_step": 85000, "rew": 790.719, "rew_std": 246.543, "Agent": "TD3"}, {"env_step": 90000, "rew": 919.297, "rew_std": 227.2307, "Agent": "TD3"}, {"env_step": 95000, "rew": 904.733, "rew_std": 246.6162, "Agent": "TD3"}, {"env_step": 100000, "rew": 827.7371, "rew_std": 224.2807, "Agent": "TD3"}, {"env_step": 105000, "rew": 877.6288, "rew_std": 302.8262, "Agent": "TD3"}, {"env_step": 110000, "rew": 909.9317, "rew_std": 494.907, "Agent": "TD3"}, {"env_step": 115000, "rew": 1157.1115, "rew_std": 416.5022, "Agent": "TD3"}, {"env_step": 120000, "rew": 1124.3433, "rew_std": 486.0497, "Agent": "TD3"}, {"env_step": 125000, "rew": 1267.6399, "rew_std": 570.4972, "Agent": "TD3"}, {"env_step": 130000, "rew": 1185.5972, "rew_std": 499.663, "Agent": "TD3"}, {"env_step": 135000, "rew": 1192.8429, "rew_std": 534.078, "Agent": "TD3"}, {"env_step": 140000, "rew": 1378.7758, "rew_std": 648.9205, "Agent": "TD3"}, {"env_step": 145000, "rew": 1346.322, "rew_std": 606.1947, "Agent": "TD3"}, {"env_step": 150000, "rew": 1505.2054, "rew_std": 677.1879, "Agent": "TD3"}, {"env_step": 155000, "rew": 1381.1472, "rew_std": 674.4805, "Agent": "TD3"}, {"env_step": 160000, "rew": 1399.9608, "rew_std": 402.3369, "Agent": "TD3"}, {"env_step": 165000, "rew": 1796.5644, "rew_std": 536.4386, "Agent": "TD3"}, {"env_step": 170000, "rew": 1493.7889, "rew_std": 721.5545, "Agent": "TD3"}, {"env_step": 175000, "rew": 1725.0112, "rew_std": 623.0873, "Agent": "TD3"}, {"env_step": 180000, "rew": 1938.587, "rew_std": 717.4994, "Agent": "TD3"}, {"env_step": 185000, "rew": 1783.4559, "rew_std": 740.0566, "Agent": "TD3"}, {"env_step": 190000, "rew": 1865.5029, "rew_std": 575.1663, "Agent": "TD3"}, {"env_step": 195000, "rew": 1894.567, "rew_std": 588.6718, "Agent": "TD3"}, {"env_step": 200000, "rew": 1987.107, "rew_std": 656.7583, "Agent": "TD3"}, {"env_step": 205000, "rew": 1794.3525, "rew_std": 506.857, "Agent": "TD3"}, {"env_step": 210000, "rew": 2027.3582, "rew_std": 788.0785, "Agent": "TD3"}, {"env_step": 215000, "rew": 2086.72, "rew_std": 493.8283, "Agent": "TD3"}, {"env_step": 220000, "rew": 2199.8547, "rew_std": 800.2519, "Agent": "TD3"}, {"env_step": 225000, "rew": 2274.8124, "rew_std": 698.8824, "Agent": "TD3"}, {"env_step": 230000, "rew": 2389.5561, "rew_std": 639.7828, "Agent": "TD3"}, {"env_step": 235000, "rew": 2579.1222, "rew_std": 680.182, "Agent": "TD3"}, {"env_step": 240000, "rew": 2322.6897, "rew_std": 490.1931, "Agent": "TD3"}, {"env_step": 245000, "rew": 2498.8825, "rew_std": 726.4331, "Agent": "TD3"}, {"env_step": 250000, "rew": 2523.3431, "rew_std": 643.0873, "Agent": "TD3"}, {"env_step": 255000, "rew": 2525.9347, "rew_std": 572.6054, "Agent": "TD3"}, {"env_step": 260000, "rew": 2875.4046, "rew_std": 707.0678, "Agent": "TD3"}, {"env_step": 265000, "rew": 2664.8142, "rew_std": 672.9307, "Agent": "TD3"}, {"env_step": 270000, "rew": 2917.7714, "rew_std": 714.7034, "Agent": "TD3"}, {"env_step": 275000, "rew": 2790.7163, "rew_std": 934.7828, "Agent": "TD3"}, {"env_step": 280000, "rew": 2977.8037, "rew_std": 826.6263, "Agent": "TD3"}, {"env_step": 285000, "rew": 2697.3986, "rew_std": 734.8315, "Agent": "TD3"}, {"env_step": 290000, "rew": 2907.1497, "rew_std": 863.047, "Agent": "TD3"}, {"env_step": 295000, "rew": 2967.0549, "rew_std": 708.2859, "Agent": "TD3"}, {"env_step": 300000, "rew": 2836.3506, "rew_std": 522.9356, "Agent": "TD3"}, {"env_step": 305000, "rew": 3079.2142, "rew_std": 781.9768, "Agent": "TD3"}, {"env_step": 310000, "rew": 2442.7108, "rew_std": 1035.4865, "Agent": "TD3"}, {"env_step": 315000, "rew": 2990.2987, "rew_std": 722.2599, "Agent": "TD3"}, {"env_step": 320000, "rew": 3125.9481, "rew_std": 729.2069, "Agent": "TD3"}, {"env_step": 325000, "rew": 3259.542, "rew_std": 711.0829, "Agent": "TD3"}, {"env_step": 330000, "rew": 3276.4432, "rew_std": 859.4927, "Agent": "TD3"}, {"env_step": 335000, "rew": 3186.125, "rew_std": 830.8368, "Agent": "TD3"}, {"env_step": 340000, "rew": 3258.4379, "rew_std": 710.1632, "Agent": "TD3"}, {"env_step": 345000, "rew": 3429.9357, "rew_std": 816.5659, "Agent": "TD3"}, {"env_step": 350000, "rew": 3142.0116, "rew_std": 924.3029, "Agent": "TD3"}, {"env_step": 355000, "rew": 3418.0257, "rew_std": 965.9174, "Agent": "TD3"}, {"env_step": 360000, "rew": 3423.1524, "rew_std": 903.6584, "Agent": "TD3"}, {"env_step": 365000, "rew": 3349.9063, "rew_std": 924.1522, "Agent": "TD3"}, {"env_step": 370000, "rew": 3388.3679, "rew_std": 670.0697, "Agent": "TD3"}, {"env_step": 375000, "rew": 3495.4122, "rew_std": 881.0026, "Agent": "TD3"}, {"env_step": 380000, "rew": 3522.7816, "rew_std": 834.9933, "Agent": "TD3"}, {"env_step": 385000, "rew": 3659.0542, "rew_std": 969.7367, "Agent": "TD3"}, {"env_step": 390000, "rew": 3412.5765, "rew_std": 1009.7869, "Agent": "TD3"}, {"env_step": 395000, "rew": 3441.4975, "rew_std": 828.764, "Agent": "TD3"}, {"env_step": 400000, "rew": 3507.3728, "rew_std": 1011.5694, "Agent": "TD3"}, {"env_step": 405000, "rew": 3505.6583, "rew_std": 961.0357, "Agent": "TD3"}, {"env_step": 410000, "rew": 3562.0921, "rew_std": 1000.0948, "Agent": "TD3"}, {"env_step": 415000, "rew": 3593.3924, "rew_std": 922.8568, "Agent": "TD3"}, {"env_step": 420000, "rew": 3622.2384, "rew_std": 836.6786, "Agent": "TD3"}, {"env_step": 425000, "rew": 3638.8397, "rew_std": 887.4577, "Agent": "TD3"}, {"env_step": 430000, "rew": 3628.5981, "rew_std": 902.6081, "Agent": "TD3"}, {"env_step": 435000, "rew": 3755.8288, "rew_std": 1041.5487, "Agent": "TD3"}, {"env_step": 440000, "rew": 3924.9246, "rew_std": 904.4263, "Agent": "TD3"}, {"env_step": 445000, "rew": 3848.7819, "rew_std": 863.726, "Agent": "TD3"}, {"env_step": 450000, "rew": 3786.3387, "rew_std": 881.7482, "Agent": "TD3"}, {"env_step": 455000, "rew": 3717.0026, "rew_std": 907.9821, "Agent": "TD3"}, {"env_step": 460000, "rew": 3972.8882, "rew_std": 873.4861, "Agent": "TD3"}, {"env_step": 465000, "rew": 3932.6164, "rew_std": 978.6592, "Agent": "TD3"}, {"env_step": 470000, "rew": 3856.3465, "rew_std": 963.4382, "Agent": "TD3"}, {"env_step": 475000, "rew": 3718.0162, "rew_std": 842.7566, "Agent": "TD3"}, {"env_step": 480000, "rew": 3738.2352, "rew_std": 995.4955, "Agent": "TD3"}, {"env_step": 485000, "rew": 3987.6998, "rew_std": 952.0839, "Agent": "TD3"}, {"env_step": 490000, "rew": 4052.6013, "rew_std": 783.8302, "Agent": "TD3"}, {"env_step": 495000, "rew": 3984.2972, "rew_std": 884.055, "Agent": "TD3"}, {"env_step": 500000, "rew": 3911.7144, "rew_std": 969.3004, "Agent": "TD3"}, {"env_step": 505000, "rew": 4126.2723, "rew_std": 863.1074, "Agent": "TD3"}, {"env_step": 510000, "rew": 3886.6877, "rew_std": 957.9709, "Agent": "TD3"}, {"env_step": 515000, "rew": 4062.4149, "rew_std": 1049.8531, "Agent": "TD3"}, {"env_step": 520000, "rew": 4084.531, "rew_std": 1042.5492, "Agent": "TD3"}, {"env_step": 525000, "rew": 4004.6619, "rew_std": 1103.5235, "Agent": "TD3"}, {"env_step": 530000, "rew": 3934.9948, "rew_std": 1061.6479, "Agent": "TD3"}, {"env_step": 535000, "rew": 3868.5868, "rew_std": 916.7911, "Agent": "TD3"}, {"env_step": 540000, "rew": 4259.9649, "rew_std": 779.3447, "Agent": "TD3"}, {"env_step": 545000, "rew": 4244.3096, "rew_std": 1002.53, "Agent": "TD3"}, {"env_step": 550000, "rew": 3960.2673, "rew_std": 876.5064, "Agent": "TD3"}, {"env_step": 555000, "rew": 4220.8084, "rew_std": 937.5224, "Agent": "TD3"}, {"env_step": 560000, "rew": 3938.5143, "rew_std": 820.3796, "Agent": "TD3"}, {"env_step": 565000, "rew": 4187.9774, "rew_std": 954.6565, "Agent": "TD3"}, {"env_step": 570000, "rew": 4095.1393, "rew_std": 1213.9982, "Agent": "TD3"}, {"env_step": 575000, "rew": 4315.6683, "rew_std": 871.5209, "Agent": "TD3"}, {"env_step": 580000, "rew": 4267.7739, "rew_std": 971.3827, "Agent": "TD3"}, {"env_step": 585000, "rew": 4152.9573, "rew_std": 840.2973, "Agent": "TD3"}, {"env_step": 590000, "rew": 4284.2829, "rew_std": 741.1785, "Agent": "TD3"}, {"env_step": 595000, "rew": 4348.1121, "rew_std": 908.2769, "Agent": "TD3"}, {"env_step": 600000, "rew": 4227.2577, "rew_std": 772.8629, "Agent": "TD3"}, {"env_step": 605000, "rew": 4395.6928, "rew_std": 953.3646, "Agent": "TD3"}, {"env_step": 610000, "rew": 4254.7732, "rew_std": 1073.3009, "Agent": "TD3"}, {"env_step": 615000, "rew": 4351.2641, "rew_std": 884.8591, "Agent": "TD3"}, {"env_step": 620000, "rew": 4336.1917, "rew_std": 1050.0142, "Agent": "TD3"}, {"env_step": 625000, "rew": 4127.4012, "rew_std": 835.0643, "Agent": "TD3"}, {"env_step": 630000, "rew": 4275.5443, "rew_std": 971.1633, "Agent": "TD3"}, {"env_step": 635000, "rew": 4465.4718, "rew_std": 823.02, "Agent": "TD3"}, {"env_step": 640000, "rew": 4350.7206, "rew_std": 953.1402, "Agent": "TD3"}, {"env_step": 645000, "rew": 4362.6552, "rew_std": 954.6996, "Agent": "TD3"}, {"env_step": 650000, "rew": 4301.645, "rew_std": 958.4777, "Agent": "TD3"}, {"env_step": 655000, "rew": 4432.7426, "rew_std": 960.7613, "Agent": "TD3"}, {"env_step": 660000, "rew": 4523.4884, "rew_std": 989.8137, "Agent": "TD3"}, {"env_step": 665000, "rew": 4546.4361, "rew_std": 885.5609, "Agent": "TD3"}, {"env_step": 670000, "rew": 4549.9462, "rew_std": 844.8013, "Agent": "TD3"}, {"env_step": 675000, "rew": 4321.5394, "rew_std": 910.4307, "Agent": "TD3"}, {"env_step": 680000, "rew": 4563.8536, "rew_std": 940.1484, "Agent": "TD3"}, {"env_step": 685000, "rew": 4490.2904, "rew_std": 785.6802, "Agent": "TD3"}, {"env_step": 690000, "rew": 4310.1555, "rew_std": 884.1603, "Agent": "TD3"}, {"env_step": 695000, "rew": 4326.8583, "rew_std": 1042.7645, "Agent": "TD3"}, {"env_step": 700000, "rew": 4583.9799, "rew_std": 930.0643, "Agent": "TD3"}, {"env_step": 705000, "rew": 4469.792, "rew_std": 888.5858, "Agent": "TD3"}, {"env_step": 710000, "rew": 4559.0077, "rew_std": 1086.2756, "Agent": "TD3"}, {"env_step": 715000, "rew": 4509.8791, "rew_std": 973.8389, "Agent": "TD3"}, {"env_step": 720000, "rew": 4678.2358, "rew_std": 960.0865, "Agent": "TD3"}, {"env_step": 725000, "rew": 4369.9315, "rew_std": 1196.3701, "Agent": "TD3"}, {"env_step": 730000, "rew": 4633.144, "rew_std": 854.0979, "Agent": "TD3"}, {"env_step": 735000, "rew": 4412.2788, "rew_std": 995.7851, "Agent": "TD3"}, {"env_step": 740000, "rew": 4541.2385, "rew_std": 1104.5576, "Agent": "TD3"}, {"env_step": 745000, "rew": 4534.3878, "rew_std": 795.6433, "Agent": "TD3"}, {"env_step": 750000, "rew": 4408.3879, "rew_std": 1044.1758, "Agent": "TD3"}, {"env_step": 755000, "rew": 4661.9304, "rew_std": 1098.4214, "Agent": "TD3"}, {"env_step": 760000, "rew": 4672.0089, "rew_std": 858.8352, "Agent": "TD3"}, {"env_step": 765000, "rew": 4641.7838, "rew_std": 741.3466, "Agent": "TD3"}, {"env_step": 770000, "rew": 4577.7005, "rew_std": 791.7753, "Agent": "TD3"}, {"env_step": 775000, "rew": 4645.9155, "rew_std": 916.5786, "Agent": "TD3"}, {"env_step": 780000, "rew": 4626.3724, "rew_std": 838.3194, "Agent": "TD3"}, {"env_step": 785000, "rew": 4590.6479, "rew_std": 826.8026, "Agent": "TD3"}, {"env_step": 790000, "rew": 4693.2594, "rew_std": 881.5832, "Agent": "TD3"}, {"env_step": 795000, "rew": 4571.8228, "rew_std": 1001.9763, "Agent": "TD3"}, {"env_step": 800000, "rew": 4749.5884, "rew_std": 1079.7026, "Agent": "TD3"}, {"env_step": 805000, "rew": 4749.8754, "rew_std": 895.1584, "Agent": "TD3"}, {"env_step": 810000, "rew": 4597.6498, "rew_std": 1036.8005, "Agent": "TD3"}, {"env_step": 815000, "rew": 4752.6457, "rew_std": 1035.2265, "Agent": "TD3"}, {"env_step": 820000, "rew": 4798.439, "rew_std": 832.0876, "Agent": "TD3"}, {"env_step": 825000, "rew": 4715.2744, "rew_std": 970.3636, "Agent": "TD3"}, {"env_step": 830000, "rew": 4682.6615, "rew_std": 972.6327, "Agent": "TD3"}, {"env_step": 835000, "rew": 4528.5159, "rew_std": 749.9223, "Agent": "TD3"}, {"env_step": 840000, "rew": 4867.6554, "rew_std": 895.6796, "Agent": "TD3"}, {"env_step": 845000, "rew": 4631.9192, "rew_std": 881.8808, "Agent": "TD3"}, {"env_step": 850000, "rew": 4780.6696, "rew_std": 913.4925, "Agent": "TD3"}, {"env_step": 855000, "rew": 4673.5937, "rew_std": 971.9718, "Agent": "TD3"}, {"env_step": 860000, "rew": 4731.0357, "rew_std": 968.3834, "Agent": "TD3"}, {"env_step": 865000, "rew": 4852.9469, "rew_std": 815.505, "Agent": "TD3"}, {"env_step": 870000, "rew": 4809.0254, "rew_std": 889.6001, "Agent": "TD3"}, {"env_step": 875000, "rew": 4737.5216, "rew_std": 828.7946, "Agent": "TD3"}, {"env_step": 880000, "rew": 4877.515, "rew_std": 808.7414, "Agent": "TD3"}, {"env_step": 885000, "rew": 4461.5787, "rew_std": 1001.0224, "Agent": "TD3"}, {"env_step": 890000, "rew": 4812.5231, "rew_std": 824.0173, "Agent": "TD3"}, {"env_step": 895000, "rew": 4809.0292, "rew_std": 822.1125, "Agent": "TD3"}, {"env_step": 900000, "rew": 4887.8963, "rew_std": 895.6354, "Agent": "TD3"}, {"env_step": 905000, "rew": 5053.9041, "rew_std": 762.3531, "Agent": "TD3"}, {"env_step": 910000, "rew": 4857.3797, "rew_std": 998.3682, "Agent": "TD3"}, {"env_step": 915000, "rew": 4907.1562, "rew_std": 826.4833, "Agent": "TD3"}, {"env_step": 920000, "rew": 4846.0661, "rew_std": 799.8304, "Agent": "TD3"}, {"env_step": 925000, "rew": 4923.9718, "rew_std": 725.9898, "Agent": "TD3"}, {"env_step": 930000, "rew": 4834.1895, "rew_std": 1053.2119, "Agent": "TD3"}, {"env_step": 935000, "rew": 5029.8406, "rew_std": 870.2379, "Agent": "TD3"}, {"env_step": 940000, "rew": 4828.7276, "rew_std": 772.8665, "Agent": "TD3"}, {"env_step": 945000, "rew": 4816.7274, "rew_std": 1026.5873, "Agent": "TD3"}, {"env_step": 950000, "rew": 4888.2284, "rew_std": 761.6572, "Agent": "TD3"}, {"env_step": 955000, "rew": 4804.2551, "rew_std": 899.2745, "Agent": "TD3"}, {"env_step": 960000, "rew": 4841.1225, "rew_std": 982.2515, "Agent": "TD3"}, {"env_step": 965000, "rew": 5001.7156, "rew_std": 796.2098, "Agent": "TD3"}, {"env_step": 970000, "rew": 4963.6273, "rew_std": 885.9466, "Agent": "TD3"}, {"env_step": 975000, "rew": 4873.6439, "rew_std": 934.3578, "Agent": "TD3"}, {"env_step": 980000, "rew": 4986.4284, "rew_std": 727.5026, "Agent": "TD3"}, {"env_step": 985000, "rew": 5039.04, "rew_std": 826.451, "Agent": "TD3"}, {"env_step": 990000, "rew": 4960.1642, "rew_std": 784.3563, "Agent": "TD3"}, {"env_step": 995000, "rew": 4999.292, "rew_std": 777.1722, "Agent": "TD3"}, {"env_step": 1000000, "rew": 4911.2309, "rew_std": 918.1377, "Agent": "TD3"}, {"env_step": 1005000, "rew": 4769.6997, "rew_std": 1054.2545, "Agent": "TD3"}, {"env_step": 1010000, "rew": 4880.854, "rew_std": 887.1015, "Agent": "TD3"}, {"env_step": 1015000, "rew": 4863.4448, "rew_std": 950.289, "Agent": "TD3"}, {"env_step": 1020000, "rew": 5054.0226, "rew_std": 812.4345, "Agent": "TD3"}, {"env_step": 1025000, "rew": 4866.6239, "rew_std": 849.4627, "Agent": "TD3"}, {"env_step": 1030000, "rew": 4781.6789, "rew_std": 846.0881, "Agent": "TD3"}, {"env_step": 1035000, "rew": 5037.8187, "rew_std": 904.3878, "Agent": "TD3"}, {"env_step": 1040000, "rew": 5010.1024, "rew_std": 883.645, "Agent": "TD3"}, {"env_step": 1045000, "rew": 4940.0185, "rew_std": 853.7942, "Agent": "TD3"}, {"env_step": 1050000, "rew": 4869.8351, "rew_std": 1065.8683, "Agent": "TD3"}, {"env_step": 1055000, "rew": 5065.608, "rew_std": 884.4816, "Agent": "TD3"}, {"env_step": 1060000, "rew": 5079.3512, "rew_std": 797.8488, "Agent": "TD3"}, {"env_step": 1065000, "rew": 5050.3343, "rew_std": 703.362, "Agent": "TD3"}, {"env_step": 1070000, "rew": 5188.6333, "rew_std": 883.3329, "Agent": "TD3"}, {"env_step": 1075000, "rew": 4966.898, "rew_std": 924.0908, "Agent": "TD3"}, {"env_step": 1080000, "rew": 5028.612, "rew_std": 910.7201, "Agent": "TD3"}, {"env_step": 1085000, "rew": 5146.3244, "rew_std": 829.8989, "Agent": "TD3"}, {"env_step": 1090000, "rew": 5095.4587, "rew_std": 881.6364, "Agent": "TD3"}, {"env_step": 1095000, "rew": 5087.68, "rew_std": 1029.9957, "Agent": "TD3"}, {"env_step": 1100000, "rew": 5165.735, "rew_std": 757.8112, "Agent": "TD3"}, {"env_step": 1105000, "rew": 5180.7916, "rew_std": 924.8973, "Agent": "TD3"}, {"env_step": 1110000, "rew": 5258.8776, "rew_std": 723.154, "Agent": "TD3"}, {"env_step": 1115000, "rew": 5154.2468, "rew_std": 946.6712, "Agent": "TD3"}, {"env_step": 1120000, "rew": 4855.1916, "rew_std": 998.1512, "Agent": "TD3"}, {"env_step": 1125000, "rew": 5109.7468, "rew_std": 866.5871, "Agent": "TD3"}, {"env_step": 1130000, "rew": 5109.2571, "rew_std": 875.319, "Agent": "TD3"}, {"env_step": 1135000, "rew": 5249.2797, "rew_std": 817.1159, "Agent": "TD3"}, {"env_step": 1140000, "rew": 5183.5445, "rew_std": 876.9945, "Agent": "TD3"}, {"env_step": 1145000, "rew": 5111.9414, "rew_std": 935.2839, "Agent": "TD3"}, {"env_step": 1150000, "rew": 5140.7273, "rew_std": 805.8536, "Agent": "TD3"}, {"env_step": 1155000, "rew": 5037.2696, "rew_std": 845.695, "Agent": "TD3"}, {"env_step": 1160000, "rew": 5008.4221, "rew_std": 952.8048, "Agent": "TD3"}, {"env_step": 1165000, "rew": 5130.9812, "rew_std": 991.83, "Agent": "TD3"}, {"env_step": 1170000, "rew": 4889.7251, "rew_std": 1224.0601, "Agent": "TD3"}, {"env_step": 1175000, "rew": 4713.3788, "rew_std": 1632.4869, "Agent": "TD3"}, {"env_step": 1180000, "rew": 4964.1914, "rew_std": 1026.0415, "Agent": "TD3"}, {"env_step": 1185000, "rew": 4920.8587, "rew_std": 1037.1662, "Agent": "TD3"}, {"env_step": 1190000, "rew": 4827.8426, "rew_std": 995.3367, "Agent": "TD3"}, {"env_step": 1195000, "rew": 5161.0952, "rew_std": 945.0446, "Agent": "TD3"}, {"env_step": 1200000, "rew": 5250.055, "rew_std": 834.4152, "Agent": "TD3"}, {"env_step": 1205000, "rew": 5257.3788, "rew_std": 779.9084, "Agent": "TD3"}, {"env_step": 1210000, "rew": 4970.1045, "rew_std": 974.5391, "Agent": "TD3"}, {"env_step": 1215000, "rew": 4639.1005, "rew_std": 1732.0484, "Agent": "TD3"}, {"env_step": 1220000, "rew": 4353.0499, "rew_std": 2244.2511, "Agent": "TD3"}, {"env_step": 1225000, "rew": 4075.511, "rew_std": 2314.6058, "Agent": "TD3"}, {"env_step": 1230000, "rew": 5068.5288, "rew_std": 991.9342, "Agent": "TD3"}, {"env_step": 1235000, "rew": 5115.0143, "rew_std": 878.5611, "Agent": "TD3"}, {"env_step": 1240000, "rew": 5238.8184, "rew_std": 1062.6486, "Agent": "TD3"}, {"env_step": 1245000, "rew": 5198.4506, "rew_std": 794.2966, "Agent": "TD3"}, {"env_step": 1250000, "rew": 5433.2663, "rew_std": 805.9253, "Agent": "TD3"}, {"env_step": 0, "rew": 27.7176, "rew_std": 10.7358, "Agent": "REINFORCE"}, {"env_step": 30720, "rew": 33.3533, "rew_std": 15.3157, "Agent": "REINFORCE"}, {"env_step": 61440, "rew": 41.4711, "rew_std": 14.8108, "Agent": "REINFORCE"}, {"env_step": 92160, "rew": 48.6603, "rew_std": 12.8797, "Agent": "REINFORCE"}, {"env_step": 122880, "rew": 36.7399, "rew_std": 16.7203, "Agent": "REINFORCE"}, {"env_step": 153600, "rew": 44.7029, "rew_std": 12.1446, "Agent": "REINFORCE"}, {"env_step": 184320, "rew": 42.3812, "rew_std": 13.0596, "Agent": "REINFORCE"}, {"env_step": 215040, "rew": 68.8463, "rew_std": 20.4335, "Agent": "REINFORCE"}, {"env_step": 245760, "rew": 41.8285, "rew_std": 18.668, "Agent": "REINFORCE"}, {"env_step": 276480, "rew": 61.6224, "rew_std": 13.3752, "Agent": "REINFORCE"}, {"env_step": 307200, "rew": 58.2795, "rew_std": 22.9679, "Agent": "REINFORCE"}, {"env_step": 337920, "rew": 69.899, "rew_std": 24.5287, "Agent": "REINFORCE"}, {"env_step": 368640, "rew": 71.4402, "rew_std": 22.2039, "Agent": "REINFORCE"}, {"env_step": 399360, "rew": 64.7685, "rew_std": 27.8313, "Agent": "REINFORCE"}, {"env_step": 430080, "rew": 77.4212, "rew_std": 20.5991, "Agent": "REINFORCE"}, {"env_step": 460800, "rew": 81.0816, "rew_std": 32.3568, "Agent": "REINFORCE"}, {"env_step": 491520, "rew": 100.2472, "rew_std": 29.5934, "Agent": "REINFORCE"}, {"env_step": 522240, "rew": 105.3082, "rew_std": 36.861, "Agent": "REINFORCE"}, {"env_step": 552960, "rew": 88.4532, "rew_std": 24.8457, "Agent": "REINFORCE"}, {"env_step": 583680, "rew": 132.3005, "rew_std": 36.845, "Agent": "REINFORCE"}, {"env_step": 614400, "rew": 115.8723, "rew_std": 45.9245, "Agent": "REINFORCE"}, {"env_step": 645120, "rew": 128.5706, "rew_std": 31.6052, "Agent": "REINFORCE"}, {"env_step": 675840, "rew": 139.1624, "rew_std": 38.3564, "Agent": "REINFORCE"}, {"env_step": 706560, "rew": 122.3089, "rew_std": 22.9594, "Agent": "REINFORCE"}, {"env_step": 737280, "rew": 139.8168, "rew_std": 36.04, "Agent": "REINFORCE"}, {"env_step": 768000, "rew": 135.3548, "rew_std": 31.8188, "Agent": "REINFORCE"}, {"env_step": 798720, "rew": 154.814, "rew_std": 36.1231, "Agent": "REINFORCE"}, {"env_step": 829440, "rew": 138.0523, "rew_std": 23.4258, "Agent": "REINFORCE"}, {"env_step": 860160, "rew": 154.9802, "rew_std": 28.0355, "Agent": "REINFORCE"}, {"env_step": 890880, "rew": 163.9125, "rew_std": 46.5653, "Agent": "REINFORCE"}, {"env_step": 921600, "rew": 178.5543, "rew_std": 39.1556, "Agent": "REINFORCE"}, {"env_step": 952320, "rew": 148.4363, "rew_std": 31.9275, "Agent": "REINFORCE"}, {"env_step": 983040, "rew": 173.0948, "rew_std": 35.8674, "Agent": "REINFORCE"}, {"env_step": 1013760, "rew": 184.1079, "rew_std": 48.525, "Agent": "REINFORCE"}, {"env_step": 1044480, "rew": 188.7721, "rew_std": 47.7577, "Agent": "REINFORCE"}, {"env_step": 1075200, "rew": 222.5404, "rew_std": 45.0577, "Agent": "REINFORCE"}, {"env_step": 1105920, "rew": 204.1252, "rew_std": 58.2783, "Agent": "REINFORCE"}, {"env_step": 1136640, "rew": 227.1378, "rew_std": 68.7146, "Agent": "REINFORCE"}, {"env_step": 1167360, "rew": 205.754, "rew_std": 21.5251, "Agent": "REINFORCE"}, {"env_step": 1198080, "rew": 195.8821, "rew_std": 38.2101, "Agent": "REINFORCE"}, {"env_step": 1228800, "rew": 222.6474, "rew_std": 26.4, "Agent": "REINFORCE"}, {"env_step": 1259520, "rew": 215.2108, "rew_std": 46.4782, "Agent": "REINFORCE"}, {"env_step": 1290240, "rew": 225.4944, "rew_std": 47.4316, "Agent": "REINFORCE"}, {"env_step": 1320960, "rew": 247.2296, "rew_std": 41.7104, "Agent": "REINFORCE"}, {"env_step": 1351680, "rew": 248.6715, "rew_std": 42.0487, "Agent": "REINFORCE"}, {"env_step": 1382400, "rew": 250.6153, "rew_std": 48.6851, "Agent": "REINFORCE"}, {"env_step": 1413120, "rew": 255.4334, "rew_std": 47.6847, "Agent": "REINFORCE"}, {"env_step": 1443840, "rew": 260.1298, "rew_std": 50.7508, "Agent": "REINFORCE"}, {"env_step": 1474560, "rew": 285.7685, "rew_std": 47.8319, "Agent": "REINFORCE"}, {"env_step": 1505280, "rew": 303.9189, "rew_std": 58.4329, "Agent": "REINFORCE"}, {"env_step": 1536000, "rew": 299.0006, "rew_std": 55.5217, "Agent": "REINFORCE"}, {"env_step": 1566720, "rew": 291.9584, "rew_std": 48.0131, "Agent": "REINFORCE"}, {"env_step": 1597440, "rew": 298.1129, "rew_std": 71.0903, "Agent": "REINFORCE"}, {"env_step": 1628160, "rew": 295.2096, "rew_std": 55.1375, "Agent": "REINFORCE"}, {"env_step": 1658880, "rew": 256.9214, "rew_std": 31.8228, "Agent": "REINFORCE"}, {"env_step": 1689600, "rew": 306.4976, "rew_std": 55.3333, "Agent": "REINFORCE"}, {"env_step": 1720320, "rew": 309.0145, "rew_std": 48.844, "Agent": "REINFORCE"}, {"env_step": 1751040, "rew": 292.7145, "rew_std": 49.9569, "Agent": "REINFORCE"}, {"env_step": 1781760, "rew": 297.1903, "rew_std": 57.495, "Agent": "REINFORCE"}, {"env_step": 1812480, "rew": 285.1572, "rew_std": 77.7148, "Agent": "REINFORCE"}, {"env_step": 1843200, "rew": 302.7925, "rew_std": 98.092, "Agent": "REINFORCE"}, {"env_step": 1873920, "rew": 312.8332, "rew_std": 80.4849, "Agent": "REINFORCE"}, {"env_step": 1904640, "rew": 328.3923, "rew_std": 44.7151, "Agent": "REINFORCE"}, {"env_step": 1935360, "rew": 353.9316, "rew_std": 50.9284, "Agent": "REINFORCE"}, {"env_step": 1966080, "rew": 326.6882, "rew_std": 89.6125, "Agent": "REINFORCE"}, {"env_step": 1996800, "rew": 304.3854, "rew_std": 78.2457, "Agent": "REINFORCE"}, {"env_step": 2027520, "rew": 364.8491, "rew_std": 45.1922, "Agent": "REINFORCE"}, {"env_step": 2058240, "rew": 301.7265, "rew_std": 74.8352, "Agent": "REINFORCE"}, {"env_step": 2088960, "rew": 324.6792, "rew_std": 53.6144, "Agent": "REINFORCE"}, {"env_step": 2119680, "rew": 341.6978, "rew_std": 63.9434, "Agent": "REINFORCE"}, {"env_step": 2150400, "rew": 363.9016, "rew_std": 64.7186, "Agent": "REINFORCE"}, {"env_step": 2181120, "rew": 374.0682, "rew_std": 45.6372, "Agent": "REINFORCE"}, {"env_step": 2211840, "rew": 385.5681, "rew_std": 89.3322, "Agent": "REINFORCE"}, {"env_step": 2242560, "rew": 378.1436, "rew_std": 86.5271, "Agent": "REINFORCE"}, {"env_step": 2273280, "rew": 335.9349, "rew_std": 75.4024, "Agent": "REINFORCE"}, {"env_step": 2304000, "rew": 423.9954, "rew_std": 65.6686, "Agent": "REINFORCE"}, {"env_step": 2334720, "rew": 385.9904, "rew_std": 49.5371, "Agent": "REINFORCE"}, {"env_step": 2365440, "rew": 373.246, "rew_std": 87.2209, "Agent": "REINFORCE"}, {"env_step": 2396160, "rew": 360.8469, "rew_std": 79.2568, "Agent": "REINFORCE"}, {"env_step": 2426880, "rew": 417.3086, "rew_std": 99.0708, "Agent": "REINFORCE"}, {"env_step": 2457600, "rew": 385.6445, "rew_std": 93.4971, "Agent": "REINFORCE"}, {"env_step": 2488320, "rew": 416.7968, "rew_std": 61.8736, "Agent": "REINFORCE"}, {"env_step": 2519040, "rew": 380.9239, "rew_std": 72.2998, "Agent": "REINFORCE"}, {"env_step": 2549760, "rew": 356.601, "rew_std": 79.8959, "Agent": "REINFORCE"}, {"env_step": 2580480, "rew": 437.0575, "rew_std": 77.9993, "Agent": "REINFORCE"}, {"env_step": 2611200, "rew": 393.3934, "rew_std": 82.0512, "Agent": "REINFORCE"}, {"env_step": 2641920, "rew": 390.14, "rew_std": 74.0242, "Agent": "REINFORCE"}, {"env_step": 2672640, "rew": 380.3886, "rew_std": 44.6099, "Agent": "REINFORCE"}, {"env_step": 2703360, "rew": 411.4326, "rew_std": 39.9505, "Agent": "REINFORCE"}, {"env_step": 2734080, "rew": 426.8174, "rew_std": 43.9964, "Agent": "REINFORCE"}, {"env_step": 2764800, "rew": 390.6643, "rew_std": 66.2562, "Agent": "REINFORCE"}, {"env_step": 2795520, "rew": 396.97, "rew_std": 104.7072, "Agent": "REINFORCE"}, {"env_step": 2826240, "rew": 467.2725, "rew_std": 48.5015, "Agent": "REINFORCE"}, {"env_step": 2856960, "rew": 374.8978, "rew_std": 108.3885, "Agent": "REINFORCE"}, {"env_step": 2887680, "rew": 450.2795, "rew_std": 95.4089, "Agent": "REINFORCE"}, {"env_step": 2918400, "rew": 428.4842, "rew_std": 111.6204, "Agent": "REINFORCE"}, {"env_step": 2949120, "rew": 417.3782, "rew_std": 91.5549, "Agent": "REINFORCE"}, {"env_step": 2979840, "rew": 383.2412, "rew_std": 78.9286, "Agent": "REINFORCE"}, {"env_step": 3010560, "rew": 448.1727, "rew_std": 133.4732, "Agent": "REINFORCE"}, {"env_step": 3041280, "rew": 474.9232, "rew_std": 133.5394, "Agent": "REINFORCE"}, {"env_step": 3072000, "rew": 458.941, "rew_std": 87.7709, "Agent": "REINFORCE"}, {"env_step": 3102720, "rew": 434.3256, "rew_std": 119.6724, "Agent": "REINFORCE"}, {"env_step": 3133440, "rew": 425.1408, "rew_std": 113.6893, "Agent": "REINFORCE"}, {"env_step": 3164160, "rew": 445.6428, "rew_std": 89.4675, "Agent": "REINFORCE"}, {"env_step": 3194880, "rew": 441.357, "rew_std": 89.8821, "Agent": "REINFORCE"}, {"env_step": 3225600, "rew": 469.4754, "rew_std": 94.0679, "Agent": "REINFORCE"}, {"env_step": 3256320, "rew": 433.924, "rew_std": 121.3369, "Agent": "REINFORCE"}, {"env_step": 3287040, "rew": 393.9809, "rew_std": 122.1391, "Agent": "REINFORCE"}, {"env_step": 3317760, "rew": 442.0835, "rew_std": 97.7841, "Agent": "REINFORCE"}, {"env_step": 3348480, "rew": 433.7272, "rew_std": 61.3641, "Agent": "REINFORCE"}, {"env_step": 3379200, "rew": 447.5686, "rew_std": 84.2138, "Agent": "REINFORCE"}, {"env_step": 3409920, "rew": 497.7688, "rew_std": 86.3697, "Agent": "REINFORCE"}, {"env_step": 3440640, "rew": 533.3218, "rew_std": 71.5671, "Agent": "REINFORCE"}, {"env_step": 3471360, "rew": 439.6428, "rew_std": 62.7993, "Agent": "REINFORCE"}, {"env_step": 3502080, "rew": 459.9121, "rew_std": 108.291, "Agent": "REINFORCE"}, {"env_step": 3532800, "rew": 459.4379, "rew_std": 132.8943, "Agent": "REINFORCE"}, {"env_step": 3563520, "rew": 470.9714, "rew_std": 106.7905, "Agent": "REINFORCE"}, {"env_step": 3594240, "rew": 502.5269, "rew_std": 112.8716, "Agent": "REINFORCE"}, {"env_step": 3624960, "rew": 518.7053, "rew_std": 85.9213, "Agent": "REINFORCE"}, {"env_step": 3655680, "rew": 510.9007, "rew_std": 81.0547, "Agent": "REINFORCE"}, {"env_step": 3686400, "rew": 422.44, "rew_std": 101.416, "Agent": "REINFORCE"}, {"env_step": 3717120, "rew": 509.2242, "rew_std": 133.3777, "Agent": "REINFORCE"}, {"env_step": 3747840, "rew": 478.1535, "rew_std": 142.6283, "Agent": "REINFORCE"}, {"env_step": 3778560, "rew": 424.1849, "rew_std": 55.8675, "Agent": "REINFORCE"}, {"env_step": 3809280, "rew": 414.8215, "rew_std": 103.8898, "Agent": "REINFORCE"}, {"env_step": 3840000, "rew": 440.345, "rew_std": 167.3447, "Agent": "REINFORCE"}, {"env_step": 3870720, "rew": 476.521, "rew_std": 131.104, "Agent": "REINFORCE"}, {"env_step": 3901440, "rew": 519.2961, "rew_std": 98.1275, "Agent": "REINFORCE"}, {"env_step": 3932160, "rew": 560.9757, "rew_std": 149.2555, "Agent": "REINFORCE"}, {"env_step": 3962880, "rew": 468.661, "rew_std": 148.3693, "Agent": "REINFORCE"}, {"env_step": 3993600, "rew": 429.7429, "rew_std": 92.4378, "Agent": "REINFORCE"}, {"env_step": 4024320, "rew": 530.7159, "rew_std": 115.3881, "Agent": "REINFORCE"}, {"env_step": 4055040, "rew": 504.7885, "rew_std": 139.296, "Agent": "REINFORCE"}, {"env_step": 4085760, "rew": 527.264, "rew_std": 114.0875, "Agent": "REINFORCE"}, {"env_step": 4116480, "rew": 524.9679, "rew_std": 97.0679, "Agent": "REINFORCE"}, {"env_step": 4147200, "rew": 502.5799, "rew_std": 51.4227, "Agent": "REINFORCE"}, {"env_step": 4177920, "rew": 558.6022, "rew_std": 141.0198, "Agent": "REINFORCE"}, {"env_step": 4208640, "rew": 542.5564, "rew_std": 143.6826, "Agent": "REINFORCE"}, {"env_step": 4239360, "rew": 565.7178, "rew_std": 123.4404, "Agent": "REINFORCE"}, {"env_step": 4270080, "rew": 588.5188, "rew_std": 91.6356, "Agent": "REINFORCE"}, {"env_step": 4300800, "rew": 509.4929, "rew_std": 88.4461, "Agent": "REINFORCE"}, {"env_step": 4331520, "rew": 560.255, "rew_std": 110.7314, "Agent": "REINFORCE"}, {"env_step": 4362240, "rew": 584.3804, "rew_std": 115.0177, "Agent": "REINFORCE"}, {"env_step": 4392960, "rew": 511.6448, "rew_std": 115.7761, "Agent": "REINFORCE"}, {"env_step": 4423680, "rew": 548.2895, "rew_std": 97.5672, "Agent": "REINFORCE"}, {"env_step": 4454400, "rew": 643.0676, "rew_std": 147.6213, "Agent": "REINFORCE"}, {"env_step": 4485120, "rew": 549.4917, "rew_std": 92.6585, "Agent": "REINFORCE"}, {"env_step": 4515840, "rew": 514.8249, "rew_std": 137.2659, "Agent": "REINFORCE"}, {"env_step": 4546560, "rew": 584.2434, "rew_std": 127.4338, "Agent": "REINFORCE"}, {"env_step": 4577280, "rew": 603.557, "rew_std": 106.7744, "Agent": "REINFORCE"}, {"env_step": 4608000, "rew": 509.8114, "rew_std": 113.999, "Agent": "REINFORCE"}, {"env_step": 4638720, "rew": 570.2314, "rew_std": 128.3169, "Agent": "REINFORCE"}, {"env_step": 4669440, "rew": 561.8519, "rew_std": 167.7081, "Agent": "REINFORCE"}, {"env_step": 4700160, "rew": 512.5841, "rew_std": 105.8006, "Agent": "REINFORCE"}, {"env_step": 4730880, "rew": 579.3501, "rew_std": 131.1142, "Agent": "REINFORCE"}, {"env_step": 4761600, "rew": 580.1297, "rew_std": 136.0232, "Agent": "REINFORCE"}, {"env_step": 4792320, "rew": 515.8023, "rew_std": 102.5996, "Agent": "REINFORCE"}, {"env_step": 4823040, "rew": 598.8872, "rew_std": 158.7483, "Agent": "REINFORCE"}, {"env_step": 4853760, "rew": 622.3687, "rew_std": 95.173, "Agent": "REINFORCE"}, {"env_step": 4884480, "rew": 544.3778, "rew_std": 112.6735, "Agent": "REINFORCE"}, {"env_step": 4915200, "rew": 588.5974, "rew_std": 113.4368, "Agent": "REINFORCE"}, {"env_step": 4945920, "rew": 550.9882, "rew_std": 133.2863, "Agent": "REINFORCE"}, {"env_step": 4976640, "rew": 541.7536, "rew_std": 89.7816, "Agent": "REINFORCE"}, {"env_step": 5007360, "rew": 603.986, "rew_std": 135.1224, "Agent": "REINFORCE"}, {"env_step": 5038080, "rew": 583.561, "rew_std": 114.0059, "Agent": "REINFORCE"}, {"env_step": 5068800, "rew": 567.4875, "rew_std": 147.1721, "Agent": "REINFORCE"}, {"env_step": 5099520, "rew": 572.4557, "rew_std": 156.9581, "Agent": "REINFORCE"}, {"env_step": 5130240, "rew": 666.3246, "rew_std": 176.1906, "Agent": "REINFORCE"}, {"env_step": 5160960, "rew": 597.1891, "rew_std": 151.6925, "Agent": "REINFORCE"}, {"env_step": 5191680, "rew": 597.5578, "rew_std": 165.4627, "Agent": "REINFORCE"}, {"env_step": 5222400, "rew": 559.7764, "rew_std": 121.6349, "Agent": "REINFORCE"}, {"env_step": 5253120, "rew": 614.2217, "rew_std": 134.1647, "Agent": "REINFORCE"}, {"env_step": 5283840, "rew": 535.2713, "rew_std": 184.4832, "Agent": "REINFORCE"}, {"env_step": 5314560, "rew": 644.3689, "rew_std": 122.9989, "Agent": "REINFORCE"}, {"env_step": 5345280, "rew": 576.1621, "rew_std": 149.0917, "Agent": "REINFORCE"}, {"env_step": 5376000, "rew": 561.303, "rew_std": 165.4708, "Agent": "REINFORCE"}, {"env_step": 5406720, "rew": 648.7732, "rew_std": 219.9609, "Agent": "REINFORCE"}, {"env_step": 5437440, "rew": 576.5953, "rew_std": 140.9941, "Agent": "REINFORCE"}, {"env_step": 5468160, "rew": 562.7847, "rew_std": 152.2883, "Agent": "REINFORCE"}, {"env_step": 5498880, "rew": 655.4698, "rew_std": 101.2357, "Agent": "REINFORCE"}, {"env_step": 5529600, "rew": 626.2532, "rew_std": 225.647, "Agent": "REINFORCE"}, {"env_step": 5560320, "rew": 561.6642, "rew_std": 162.0297, "Agent": "REINFORCE"}, {"env_step": 5591040, "rew": 621.637, "rew_std": 144.4238, "Agent": "REINFORCE"}, {"env_step": 5621760, "rew": 621.095, "rew_std": 299.2659, "Agent": "REINFORCE"}, {"env_step": 5652480, "rew": 591.8279, "rew_std": 160.6478, "Agent": "REINFORCE"}, {"env_step": 5683200, "rew": 566.1898, "rew_std": 124.7465, "Agent": "REINFORCE"}, {"env_step": 5713920, "rew": 571.6892, "rew_std": 99.2399, "Agent": "REINFORCE"}, {"env_step": 5744640, "rew": 518.5974, "rew_std": 110.1643, "Agent": "REINFORCE"}, {"env_step": 5775360, "rew": 507.0606, "rew_std": 118.8786, "Agent": "REINFORCE"}, {"env_step": 5806080, "rew": 645.1324, "rew_std": 118.7828, "Agent": "REINFORCE"}, {"env_step": 5836800, "rew": 575.8455, "rew_std": 130.6544, "Agent": "REINFORCE"}, {"env_step": 5867520, "rew": 580.2341, "rew_std": 148.9996, "Agent": "REINFORCE"}, {"env_step": 5898240, "rew": 639.1779, "rew_std": 125.3437, "Agent": "REINFORCE"}, {"env_step": 5928960, "rew": 576.9596, "rew_std": 124.1505, "Agent": "REINFORCE"}, {"env_step": 5959680, "rew": 644.9708, "rew_std": 66.2187, "Agent": "REINFORCE"}, {"env_step": 5990400, "rew": 694.9196, "rew_std": 177.9414, "Agent": "REINFORCE"}, {"env_step": 6021120, "rew": 694.7615, "rew_std": 220.8509, "Agent": "REINFORCE"}, {"env_step": 6051840, "rew": 729.0638, "rew_std": 225.7093, "Agent": "REINFORCE"}, {"env_step": 6082560, "rew": 664.6531, "rew_std": 165.6677, "Agent": "REINFORCE"}, {"env_step": 6113280, "rew": 637.6006, "rew_std": 218.98, "Agent": "REINFORCE"}, {"env_step": 6144000, "rew": 528.8907, "rew_std": 108.5123, "Agent": "REINFORCE"}, {"env_step": 6174720, "rew": 582.7341, "rew_std": 142.043, "Agent": "REINFORCE"}, {"env_step": 6205440, "rew": 655.7331, "rew_std": 141.1264, "Agent": "REINFORCE"}, {"env_step": 6236160, "rew": 673.7024, "rew_std": 233.1061, "Agent": "REINFORCE"}, {"env_step": 6266880, "rew": 635.9546, "rew_std": 217.1002, "Agent": "REINFORCE"}, {"env_step": 6297600, "rew": 666.5248, "rew_std": 209.9766, "Agent": "REINFORCE"}, {"env_step": 6328320, "rew": 680.161, "rew_std": 140.829, "Agent": "REINFORCE"}, {"env_step": 6359040, "rew": 685.1298, "rew_std": 129.4409, "Agent": "REINFORCE"}, {"env_step": 6389760, "rew": 744.9942, "rew_std": 400.4335, "Agent": "REINFORCE"}, {"env_step": 6420480, "rew": 673.2758, "rew_std": 157.3355, "Agent": "REINFORCE"}, {"env_step": 6451200, "rew": 735.2884, "rew_std": 171.1652, "Agent": "REINFORCE"}, {"env_step": 6481920, "rew": 788.1765, "rew_std": 239.2203, "Agent": "REINFORCE"}, {"env_step": 6512640, "rew": 627.7094, "rew_std": 209.5059, "Agent": "REINFORCE"}, {"env_step": 6543360, "rew": 702.6232, "rew_std": 151.2339, "Agent": "REINFORCE"}, {"env_step": 6574080, "rew": 761.3974, "rew_std": 214.923, "Agent": "REINFORCE"}, {"env_step": 6604800, "rew": 715.0448, "rew_std": 193.3326, "Agent": "REINFORCE"}, {"env_step": 6635520, "rew": 687.1525, "rew_std": 80.5748, "Agent": "REINFORCE"}, {"env_step": 6666240, "rew": 738.8947, "rew_std": 197.2139, "Agent": "REINFORCE"}, {"env_step": 6696960, "rew": 735.0513, "rew_std": 243.043, "Agent": "REINFORCE"}, {"env_step": 6727680, "rew": 661.899, "rew_std": 137.0016, "Agent": "REINFORCE"}, {"env_step": 6758400, "rew": 717.0317, "rew_std": 115.1148, "Agent": "REINFORCE"}, {"env_step": 6789120, "rew": 713.7875, "rew_std": 190.9573, "Agent": "REINFORCE"}, {"env_step": 6819840, "rew": 753.5813, "rew_std": 224.2372, "Agent": "REINFORCE"}, {"env_step": 6850560, "rew": 827.5102, "rew_std": 200.4547, "Agent": "REINFORCE"}, {"env_step": 6881280, "rew": 790.6831, "rew_std": 281.7583, "Agent": "REINFORCE"}, {"env_step": 6912000, "rew": 828.0825, "rew_std": 186.1612, "Agent": "REINFORCE"}, {"env_step": 6942720, "rew": 740.5346, "rew_std": 192.5644, "Agent": "REINFORCE"}, {"env_step": 6973440, "rew": 768.3898, "rew_std": 173.439, "Agent": "REINFORCE"}, {"env_step": 7004160, "rew": 767.4472, "rew_std": 81.7889, "Agent": "REINFORCE"}, {"env_step": 7034880, "rew": 843.0486, "rew_std": 207.4263, "Agent": "REINFORCE"}, {"env_step": 7065600, "rew": 917.0862, "rew_std": 175.6432, "Agent": "REINFORCE"}, {"env_step": 7096320, "rew": 764.7748, "rew_std": 186.3004, "Agent": "REINFORCE"}, {"env_step": 7127040, "rew": 818.4783, "rew_std": 227.9405, "Agent": "REINFORCE"}, {"env_step": 7157760, "rew": 840.2352, "rew_std": 254.5002, "Agent": "REINFORCE"}, {"env_step": 7188480, "rew": 731.5163, "rew_std": 233.0287, "Agent": "REINFORCE"}, {"env_step": 7219200, "rew": 804.892, "rew_std": 206.5893, "Agent": "REINFORCE"}, {"env_step": 7249920, "rew": 721.1122, "rew_std": 119.3359, "Agent": "REINFORCE"}, {"env_step": 7280640, "rew": 745.0533, "rew_std": 216.2748, "Agent": "REINFORCE"}, {"env_step": 7311360, "rew": 789.4155, "rew_std": 201.4028, "Agent": "REINFORCE"}, {"env_step": 7342080, "rew": 778.7515, "rew_std": 169.0804, "Agent": "REINFORCE"}, {"env_step": 7372800, "rew": 722.2184, "rew_std": 159.7289, "Agent": "REINFORCE"}, {"env_step": 7403520, "rew": 730.5377, "rew_std": 244.0747, "Agent": "REINFORCE"}, {"env_step": 7434240, "rew": 821.842, "rew_std": 228.4728, "Agent": "REINFORCE"}, {"env_step": 7464960, "rew": 773.8623, "rew_std": 236.9126, "Agent": "REINFORCE"}, {"env_step": 7495680, "rew": 785.3531, "rew_std": 206.1696, "Agent": "REINFORCE"}, {"env_step": 7526400, "rew": 851.5261, "rew_std": 228.7796, "Agent": "REINFORCE"}, {"env_step": 7557120, "rew": 831.5571, "rew_std": 212.207, "Agent": "REINFORCE"}, {"env_step": 7587840, "rew": 813.1027, "rew_std": 244.633, "Agent": "REINFORCE"}, {"env_step": 7618560, "rew": 924.0815, "rew_std": 257.4552, "Agent": "REINFORCE"}, {"env_step": 7649280, "rew": 849.9347, "rew_std": 237.2322, "Agent": "REINFORCE"}, {"env_step": 7680000, "rew": 809.7352, "rew_std": 161.8209, "Agent": "REINFORCE"}, {"env_step": 7710720, "rew": 899.7744, "rew_std": 126.8619, "Agent": "REINFORCE"}, {"env_step": 7741440, "rew": 775.6868, "rew_std": 111.1748, "Agent": "REINFORCE"}, {"env_step": 7772160, "rew": 783.3401, "rew_std": 172.1061, "Agent": "REINFORCE"}, {"env_step": 7802880, "rew": 775.995, "rew_std": 238.964, "Agent": "REINFORCE"}, {"env_step": 7833600, "rew": 738.9181, "rew_std": 247.9718, "Agent": "REINFORCE"}, {"env_step": 7864320, "rew": 845.1103, "rew_std": 144.6614, "Agent": "REINFORCE"}, {"env_step": 7895040, "rew": 846.7213, "rew_std": 251.5901, "Agent": "REINFORCE"}, {"env_step": 7925760, "rew": 903.9714, "rew_std": 248.4302, "Agent": "REINFORCE"}, {"env_step": 7956480, "rew": 885.5948, "rew_std": 214.2679, "Agent": "REINFORCE"}, {"env_step": 7987200, "rew": 797.1632, "rew_std": 213.6274, "Agent": "REINFORCE"}, {"env_step": 8017920, "rew": 750.0977, "rew_std": 243.3167, "Agent": "REINFORCE"}, {"env_step": 8048640, "rew": 775.8821, "rew_std": 222.1063, "Agent": "REINFORCE"}, {"env_step": 8079360, "rew": 776.964, "rew_std": 195.6586, "Agent": "REINFORCE"}, {"env_step": 8110080, "rew": 834.2439, "rew_std": 307.1783, "Agent": "REINFORCE"}, {"env_step": 8140800, "rew": 922.2053, "rew_std": 245.5225, "Agent": "REINFORCE"}, {"env_step": 8171520, "rew": 900.8791, "rew_std": 257.9531, "Agent": "REINFORCE"}, {"env_step": 8202240, "rew": 896.3298, "rew_std": 277.692, "Agent": "REINFORCE"}, {"env_step": 8232960, "rew": 915.0473, "rew_std": 384.9129, "Agent": "REINFORCE"}, {"env_step": 8263680, "rew": 830.1566, "rew_std": 127.4406, "Agent": "REINFORCE"}, {"env_step": 8294400, "rew": 889.0198, "rew_std": 312.3793, "Agent": "REINFORCE"}, {"env_step": 8325120, "rew": 888.688, "rew_std": 271.7225, "Agent": "REINFORCE"}, {"env_step": 8355840, "rew": 824.6942, "rew_std": 196.723, "Agent": "REINFORCE"}, {"env_step": 8386560, "rew": 863.9463, "rew_std": 227.5124, "Agent": "REINFORCE"}, {"env_step": 8417280, "rew": 870.4753, "rew_std": 236.4412, "Agent": "REINFORCE"}, {"env_step": 8448000, "rew": 818.8857, "rew_std": 222.3761, "Agent": "REINFORCE"}, {"env_step": 8478720, "rew": 776.188, "rew_std": 228.0678, "Agent": "REINFORCE"}, {"env_step": 8509440, "rew": 882.9349, "rew_std": 201.0272, "Agent": "REINFORCE"}, {"env_step": 8540160, "rew": 825.3203, "rew_std": 188.1268, "Agent": "REINFORCE"}, {"env_step": 8570880, "rew": 831.3546, "rew_std": 251.4183, "Agent": "REINFORCE"}, {"env_step": 8601600, "rew": 820.2887, "rew_std": 219.7999, "Agent": "REINFORCE"}, {"env_step": 8632320, "rew": 925.9424, "rew_std": 204.7964, "Agent": "REINFORCE"}, {"env_step": 8663040, "rew": 765.2604, "rew_std": 149.2658, "Agent": "REINFORCE"}, {"env_step": 8693760, "rew": 913.36, "rew_std": 347.7958, "Agent": "REINFORCE"}, {"env_step": 8724480, "rew": 747.734, "rew_std": 165.6218, "Agent": "REINFORCE"}, {"env_step": 8755200, "rew": 864.8618, "rew_std": 258.5876, "Agent": "REINFORCE"}, {"env_step": 8785920, "rew": 834.3716, "rew_std": 149.974, "Agent": "REINFORCE"}, {"env_step": 8816640, "rew": 942.7596, "rew_std": 318.8342, "Agent": "REINFORCE"}, {"env_step": 8847360, "rew": 819.8248, "rew_std": 136.2533, "Agent": "REINFORCE"}, {"env_step": 8878080, "rew": 939.1256, "rew_std": 345.884, "Agent": "REINFORCE"}, {"env_step": 8908800, "rew": 919.9905, "rew_std": 318.5415, "Agent": "REINFORCE"}, {"env_step": 8939520, "rew": 952.3609, "rew_std": 243.2247, "Agent": "REINFORCE"}, {"env_step": 8970240, "rew": 1002.9598, "rew_std": 411.5419, "Agent": "REINFORCE"}, {"env_step": 9000960, "rew": 978.2093, "rew_std": 150.1634, "Agent": "REINFORCE"}, {"env_step": 9031680, "rew": 1000.6892, "rew_std": 238.6836, "Agent": "REINFORCE"}, {"env_step": 9062400, "rew": 923.7965, "rew_std": 265.0906, "Agent": "REINFORCE"}, {"env_step": 9093120, "rew": 1027.5603, "rew_std": 356.688, "Agent": "REINFORCE"}, {"env_step": 9123840, "rew": 927.87, "rew_std": 218.0477, "Agent": "REINFORCE"}, {"env_step": 9154560, "rew": 947.8009, "rew_std": 196.2311, "Agent": "REINFORCE"}, {"env_step": 9185280, "rew": 1002.6192, "rew_std": 346.7466, "Agent": "REINFORCE"}, {"env_step": 9216000, "rew": 966.7356, "rew_std": 257.1045, "Agent": "REINFORCE"}, {"env_step": 9246720, "rew": 850.2131, "rew_std": 272.2633, "Agent": "REINFORCE"}, {"env_step": 9277440, "rew": 999.9818, "rew_std": 242.1809, "Agent": "REINFORCE"}, {"env_step": 9308160, "rew": 945.274, "rew_std": 292.8736, "Agent": "REINFORCE"}, {"env_step": 9338880, "rew": 1011.6188, "rew_std": 206.0314, "Agent": "REINFORCE"}, {"env_step": 9369600, "rew": 936.7706, "rew_std": 169.1316, "Agent": "REINFORCE"}, {"env_step": 9400320, "rew": 909.0751, "rew_std": 195.3988, "Agent": "REINFORCE"}, {"env_step": 9431040, "rew": 854.0486, "rew_std": 211.4514, "Agent": "REINFORCE"}, {"env_step": 9461760, "rew": 960.132, "rew_std": 259.6515, "Agent": "REINFORCE"}, {"env_step": 9492480, "rew": 907.91, "rew_std": 339.0151, "Agent": "REINFORCE"}, {"env_step": 9523200, "rew": 1108.1313, "rew_std": 323.0787, "Agent": "REINFORCE"}, {"env_step": 9553920, "rew": 1003.4416, "rew_std": 259.1606, "Agent": "REINFORCE"}, {"env_step": 9584640, "rew": 906.0153, "rew_std": 269.067, "Agent": "REINFORCE"}, {"env_step": 9615360, "rew": 832.5955, "rew_std": 223.1421, "Agent": "REINFORCE"}, {"env_step": 9646080, "rew": 870.3656, "rew_std": 172.9299, "Agent": "REINFORCE"}, {"env_step": 9676800, "rew": 952.6487, "rew_std": 256.4124, "Agent": "REINFORCE"}, {"env_step": 9707520, "rew": 891.1408, "rew_std": 258.5006, "Agent": "REINFORCE"}, {"env_step": 9738240, "rew": 1067.376, "rew_std": 426.0889, "Agent": "REINFORCE"}, {"env_step": 9768960, "rew": 994.8644, "rew_std": 235.152, "Agent": "REINFORCE"}, {"env_step": 9799680, "rew": 1036.7538, "rew_std": 350.4073, "Agent": "REINFORCE"}, {"env_step": 9830400, "rew": 941.5028, "rew_std": 290.7186, "Agent": "REINFORCE"}, {"env_step": 9861120, "rew": 1004.6263, "rew_std": 189.7126, "Agent": "REINFORCE"}, {"env_step": 9891840, "rew": 1090.99, "rew_std": 218.7887, "Agent": "REINFORCE"}, {"env_step": 9922560, "rew": 1025.0696, "rew_std": 270.5742, "Agent": "REINFORCE"}, {"env_step": 9953280, "rew": 1001.7405, "rew_std": 334.5234, "Agent": "REINFORCE"}, {"env_step": 9984000, "rew": 859.6256, "rew_std": 283.6046, "Agent": "REINFORCE"}, {"env_step": 10014720, "rew": 916.4069, "rew_std": 234.0294, "Agent": "REINFORCE"}, {"env_step": 10045440, "rew": 999.6534, "rew_std": 370.8359, "Agent": "REINFORCE"}, {"env_step": 10076160, "rew": 956.329, "rew_std": 303.8919, "Agent": "REINFORCE"}, {"env_step": 10106880, "rew": 966.2531, "rew_std": 375.6601, "Agent": "REINFORCE"}, {"env_step": 10137600, "rew": 940.921, "rew_std": 362.3317, "Agent": "REINFORCE"}, {"env_step": 10168320, "rew": 989.9863, "rew_std": 233.9977, "Agent": "REINFORCE"}, {"env_step": 10199040, "rew": 870.4539, "rew_std": 227.1541, "Agent": "REINFORCE"}, {"env_step": 10229760, "rew": 1087.806, "rew_std": 295.9252, "Agent": "REINFORCE"}, {"env_step": 0, "rew": 990.3785, "rew_std": 4.297, "Agent": "SAC"}, {"env_step": 5000, "rew": 634.386, "rew_std": 184.9621, "Agent": "SAC"}, {"env_step": 10000, "rew": 466.3264, "rew_std": 104.4639, "Agent": "SAC"}, {"env_step": 15000, "rew": 472.4038, "rew_std": 142.9891, "Agent": "SAC"}, {"env_step": 20000, "rew": 506.0177, "rew_std": 161.9189, "Agent": "SAC"}, {"env_step": 25000, "rew": 603.8001, "rew_std": 120.5751, "Agent": "SAC"}, {"env_step": 30000, "rew": 608.1596, "rew_std": 147.4683, "Agent": "SAC"}, {"env_step": 35000, "rew": 596.8617, "rew_std": 185.3435, "Agent": "SAC"}, {"env_step": 40000, "rew": 605.0013, "rew_std": 123.9596, "Agent": "SAC"}, {"env_step": 45000, "rew": 682.4043, "rew_std": 126.4225, "Agent": "SAC"}, {"env_step": 50000, "rew": 711.1211, "rew_std": 181.235, "Agent": "SAC"}, {"env_step": 55000, "rew": 712.1348, "rew_std": 158.3893, "Agent": "SAC"}, {"env_step": 60000, "rew": 668.6808, "rew_std": 186.2096, "Agent": "SAC"}, {"env_step": 65000, "rew": 803.7135, "rew_std": 128.7597, "Agent": "SAC"}, {"env_step": 70000, "rew": 836.9211, "rew_std": 249.2294, "Agent": "SAC"}, {"env_step": 75000, "rew": 812.1804, "rew_std": 203.7858, "Agent": "SAC"}, {"env_step": 80000, "rew": 816.8486, "rew_std": 280.3634, "Agent": "SAC"}, {"env_step": 85000, "rew": 838.3772, "rew_std": 331.4502, "Agent": "SAC"}, {"env_step": 90000, "rew": 901.242, "rew_std": 295.797, "Agent": "SAC"}, {"env_step": 95000, "rew": 859.4468, "rew_std": 261.5593, "Agent": "SAC"}, {"env_step": 100000, "rew": 1019.8017, "rew_std": 449.9045, "Agent": "SAC"}, {"env_step": 105000, "rew": 1030.3104, "rew_std": 286.2318, "Agent": "SAC"}, {"env_step": 110000, "rew": 963.0668, "rew_std": 311.5471, "Agent": "SAC"}, {"env_step": 115000, "rew": 1089.9735, "rew_std": 519.6678, "Agent": "SAC"}, {"env_step": 120000, "rew": 1178.9178, "rew_std": 389.9193, "Agent": "SAC"}, {"env_step": 125000, "rew": 1322.1717, "rew_std": 393.7724, "Agent": "SAC"}, {"env_step": 130000, "rew": 1312.6976, "rew_std": 469.6964, "Agent": "SAC"}, {"env_step": 135000, "rew": 1347.1568, "rew_std": 414.4463, "Agent": "SAC"}, {"env_step": 140000, "rew": 1386.2821, "rew_std": 553.034, "Agent": "SAC"}, {"env_step": 145000, "rew": 1585.8144, "rew_std": 678.5971, "Agent": "SAC"}, {"env_step": 150000, "rew": 1426.0943, "rew_std": 782.1992, "Agent": "SAC"}, {"env_step": 155000, "rew": 1485.7579, "rew_std": 816.0993, "Agent": "SAC"}, {"env_step": 160000, "rew": 1335.9676, "rew_std": 526.1357, "Agent": "SAC"}, {"env_step": 165000, "rew": 1727.0195, "rew_std": 949.2217, "Agent": "SAC"}, {"env_step": 170000, "rew": 1815.7559, "rew_std": 780.9618, "Agent": "SAC"}, {"env_step": 175000, "rew": 1679.7342, "rew_std": 608.2833, "Agent": "SAC"}, {"env_step": 180000, "rew": 1755.6202, "rew_std": 908.6728, "Agent": "SAC"}, {"env_step": 185000, "rew": 2060.7492, "rew_std": 798.1616, "Agent": "SAC"}, {"env_step": 190000, "rew": 2071.3926, "rew_std": 891.6286, "Agent": "SAC"}, {"env_step": 195000, "rew": 1972.7574, "rew_std": 905.4189, "Agent": "SAC"}, {"env_step": 200000, "rew": 2132.5654, "rew_std": 977.1712, "Agent": "SAC"}, {"env_step": 205000, "rew": 2025.7295, "rew_std": 691.8455, "Agent": "SAC"}, {"env_step": 210000, "rew": 2247.2497, "rew_std": 695.7745, "Agent": "SAC"}, {"env_step": 215000, "rew": 2227.0186, "rew_std": 914.713, "Agent": "SAC"}, {"env_step": 220000, "rew": 2743.7285, "rew_std": 978.705, "Agent": "SAC"}, {"env_step": 225000, "rew": 2755.1179, "rew_std": 976.5856, "Agent": "SAC"}, {"env_step": 230000, "rew": 2240.208, "rew_std": 758.3069, "Agent": "SAC"}, {"env_step": 235000, "rew": 2476.1974, "rew_std": 1088.2916, "Agent": "SAC"}, {"env_step": 240000, "rew": 2759.6599, "rew_std": 868.8349, "Agent": "SAC"}, {"env_step": 245000, "rew": 2654.4313, "rew_std": 1008.0752, "Agent": "SAC"}, {"env_step": 250000, "rew": 2892.8498, "rew_std": 1175.0901, "Agent": "SAC"}, {"env_step": 255000, "rew": 3023.2165, "rew_std": 936.6243, "Agent": "SAC"}, {"env_step": 260000, "rew": 2987.143, "rew_std": 954.9922, "Agent": "SAC"}, {"env_step": 265000, "rew": 3086.6823, "rew_std": 878.5816, "Agent": "SAC"}, {"env_step": 270000, "rew": 2476.7571, "rew_std": 831.4616, "Agent": "SAC"}, {"env_step": 275000, "rew": 3028.8691, "rew_std": 810.8356, "Agent": "SAC"}, {"env_step": 280000, "rew": 3236.7877, "rew_std": 1200.7687, "Agent": "SAC"}, {"env_step": 285000, "rew": 3482.0228, "rew_std": 1098.2739, "Agent": "SAC"}, {"env_step": 290000, "rew": 3599.3998, "rew_std": 707.1372, "Agent": "SAC"}, {"env_step": 295000, "rew": 3509.0719, "rew_std": 898.0675, "Agent": "SAC"}, {"env_step": 300000, "rew": 3560.7321, "rew_std": 779.5421, "Agent": "SAC"}, {"env_step": 305000, "rew": 3496.5751, "rew_std": 1100.757, "Agent": "SAC"}, {"env_step": 310000, "rew": 3608.0523, "rew_std": 971.3736, "Agent": "SAC"}, {"env_step": 315000, "rew": 3281.9811, "rew_std": 1226.0263, "Agent": "SAC"}, {"env_step": 320000, "rew": 3766.0278, "rew_std": 1120.3099, "Agent": "SAC"}, {"env_step": 325000, "rew": 4018.244, "rew_std": 799.463, "Agent": "SAC"}, {"env_step": 330000, "rew": 3653.1125, "rew_std": 1122.2692, "Agent": "SAC"}, {"env_step": 335000, "rew": 3968.1996, "rew_std": 848.7675, "Agent": "SAC"}, {"env_step": 340000, "rew": 3903.1583, "rew_std": 586.599, "Agent": "SAC"}, {"env_step": 345000, "rew": 3799.5278, "rew_std": 897.6643, "Agent": "SAC"}, {"env_step": 350000, "rew": 3659.2519, "rew_std": 813.1146, "Agent": "SAC"}, {"env_step": 355000, "rew": 4339.5464, "rew_std": 627.7838, "Agent": "SAC"}, {"env_step": 360000, "rew": 3534.6213, "rew_std": 978.4176, "Agent": "SAC"}, {"env_step": 365000, "rew": 3823.3135, "rew_std": 840.9491, "Agent": "SAC"}, {"env_step": 370000, "rew": 4312.3502, "rew_std": 707.5655, "Agent": "SAC"}, {"env_step": 375000, "rew": 3882.813, "rew_std": 899.9477, "Agent": "SAC"}, {"env_step": 380000, "rew": 4151.4361, "rew_std": 886.019, "Agent": "SAC"}, {"env_step": 385000, "rew": 4247.4278, "rew_std": 817.3344, "Agent": "SAC"}, {"env_step": 390000, "rew": 4193.3913, "rew_std": 1289.8256, "Agent": "SAC"}, {"env_step": 395000, "rew": 4262.8331, "rew_std": 856.4907, "Agent": "SAC"}, {"env_step": 400000, "rew": 4417.5728, "rew_std": 710.4488, "Agent": "SAC"}, {"env_step": 405000, "rew": 4215.4565, "rew_std": 737.7075, "Agent": "SAC"}, {"env_step": 410000, "rew": 4656.0872, "rew_std": 618.7525, "Agent": "SAC"}, {"env_step": 415000, "rew": 4324.2753, "rew_std": 1087.3486, "Agent": "SAC"}, {"env_step": 420000, "rew": 4373.4924, "rew_std": 1044.2813, "Agent": "SAC"}, {"env_step": 425000, "rew": 4343.1537, "rew_std": 650.1327, "Agent": "SAC"}, {"env_step": 430000, "rew": 4477.3905, "rew_std": 881.3755, "Agent": "SAC"}, {"env_step": 435000, "rew": 4355.3773, "rew_std": 944.8012, "Agent": "SAC"}, {"env_step": 440000, "rew": 4675.7451, "rew_std": 647.9754, "Agent": "SAC"}, {"env_step": 445000, "rew": 4120.4879, "rew_std": 1154.4533, "Agent": "SAC"}, {"env_step": 450000, "rew": 4728.8119, "rew_std": 754.292, "Agent": "SAC"}, {"env_step": 455000, "rew": 4705.7272, "rew_std": 691.9497, "Agent": "SAC"}, {"env_step": 460000, "rew": 4537.7941, "rew_std": 1034.1699, "Agent": "SAC"}, {"env_step": 465000, "rew": 4082.6977, "rew_std": 1489.3087, "Agent": "SAC"}, {"env_step": 470000, "rew": 4350.9532, "rew_std": 1500.3143, "Agent": "SAC"}, {"env_step": 475000, "rew": 4122.221, "rew_std": 1546.766, "Agent": "SAC"}, {"env_step": 480000, "rew": 4725.6855, "rew_std": 949.7799, "Agent": "SAC"}, {"env_step": 485000, "rew": 4804.9972, "rew_std": 707.0428, "Agent": "SAC"}, {"env_step": 490000, "rew": 4877.2005, "rew_std": 643.9763, "Agent": "SAC"}, {"env_step": 495000, "rew": 5034.0545, "rew_std": 475.6285, "Agent": "SAC"}, {"env_step": 500000, "rew": 5128.7439, "rew_std": 518.8488, "Agent": "SAC"}, {"env_step": 505000, "rew": 5069.8386, "rew_std": 636.3886, "Agent": "SAC"}, {"env_step": 510000, "rew": 5159.2177, "rew_std": 596.1149, "Agent": "SAC"}, {"env_step": 515000, "rew": 4712.5957, "rew_std": 827.3416, "Agent": "SAC"}, {"env_step": 520000, "rew": 4981.1566, "rew_std": 963.9806, "Agent": "SAC"}, {"env_step": 525000, "rew": 4913.5781, "rew_std": 737.1729, "Agent": "SAC"}, {"env_step": 530000, "rew": 4850.7048, "rew_std": 852.6721, "Agent": "SAC"}, {"env_step": 535000, "rew": 4963.8677, "rew_std": 858.5452, "Agent": "SAC"}, {"env_step": 540000, "rew": 5204.4067, "rew_std": 472.5198, "Agent": "SAC"}, {"env_step": 545000, "rew": 5012.2747, "rew_std": 705.919, "Agent": "SAC"}, {"env_step": 550000, "rew": 5167.2548, "rew_std": 609.7783, "Agent": "SAC"}, {"env_step": 555000, "rew": 4387.9413, "rew_std": 2043.9651, "Agent": "SAC"}, {"env_step": 560000, "rew": 4758.9642, "rew_std": 1701.0235, "Agent": "SAC"}, {"env_step": 565000, "rew": 4160.9355, "rew_std": 2370.4786, "Agent": "SAC"}, {"env_step": 570000, "rew": 4081.5274, "rew_std": 2229.5623, "Agent": "SAC"}, {"env_step": 575000, "rew": 4145.1935, "rew_std": 2112.6704, "Agent": "SAC"}, {"env_step": 580000, "rew": 4558.6605, "rew_std": 1902.1764, "Agent": "SAC"}, {"env_step": 585000, "rew": 4824.5614, "rew_std": 1853.2917, "Agent": "SAC"}, {"env_step": 590000, "rew": 4470.5525, "rew_std": 1523.8954, "Agent": "SAC"}, {"env_step": 595000, "rew": 5261.3918, "rew_std": 814.7524, "Agent": "SAC"}, {"env_step": 600000, "rew": 4924.1725, "rew_std": 720.2538, "Agent": "SAC"}, {"env_step": 605000, "rew": 5051.8181, "rew_std": 548.6794, "Agent": "SAC"}, {"env_step": 610000, "rew": 4967.6005, "rew_std": 925.7063, "Agent": "SAC"}, {"env_step": 615000, "rew": 5394.8005, "rew_std": 639.5644, "Agent": "SAC"}, {"env_step": 620000, "rew": 5062.7683, "rew_std": 724.4078, "Agent": "SAC"}, {"env_step": 625000, "rew": 5078.1642, "rew_std": 702.1159, "Agent": "SAC"}, {"env_step": 630000, "rew": 5317.6296, "rew_std": 437.7749, "Agent": "SAC"}, {"env_step": 635000, "rew": 4704.1758, "rew_std": 2060.9637, "Agent": "SAC"}, {"env_step": 640000, "rew": 4843.6902, "rew_std": 1808.5671, "Agent": "SAC"}, {"env_step": 645000, "rew": 4581.3947, "rew_std": 1571.9396, "Agent": "SAC"}, {"env_step": 650000, "rew": 4826.9942, "rew_std": 1221.073, "Agent": "SAC"}, {"env_step": 655000, "rew": 5288.6551, "rew_std": 490.8404, "Agent": "SAC"}, {"env_step": 660000, "rew": 5335.5634, "rew_std": 508.8307, "Agent": "SAC"}, {"env_step": 665000, "rew": 5266.9036, "rew_std": 517.7074, "Agent": "SAC"}, {"env_step": 670000, "rew": 5547.8741, "rew_std": 354.7182, "Agent": "SAC"}, {"env_step": 675000, "rew": 5328.8314, "rew_std": 489.3294, "Agent": "SAC"}, {"env_step": 680000, "rew": 5405.7608, "rew_std": 288.6692, "Agent": "SAC"}, {"env_step": 685000, "rew": 5411.7402, "rew_std": 503.3251, "Agent": "SAC"}, {"env_step": 690000, "rew": 5260.8163, "rew_std": 502.3217, "Agent": "SAC"}, {"env_step": 695000, "rew": 5450.3069, "rew_std": 519.2909, "Agent": "SAC"}, {"env_step": 700000, "rew": 5336.7194, "rew_std": 764.3954, "Agent": "SAC"}, {"env_step": 705000, "rew": 5491.0999, "rew_std": 602.9351, "Agent": "SAC"}, {"env_step": 710000, "rew": 5338.5924, "rew_std": 430.7632, "Agent": "SAC"}, {"env_step": 715000, "rew": 5694.361, "rew_std": 227.2388, "Agent": "SAC"}, {"env_step": 720000, "rew": 5406.0092, "rew_std": 443.1683, "Agent": "SAC"}, {"env_step": 725000, "rew": 5575.3379, "rew_std": 379.3146, "Agent": "SAC"}, {"env_step": 730000, "rew": 5475.6525, "rew_std": 482.8181, "Agent": "SAC"}, {"env_step": 735000, "rew": 5315.6012, "rew_std": 605.0353, "Agent": "SAC"}, {"env_step": 740000, "rew": 5569.833, "rew_std": 348.5342, "Agent": "SAC"}, {"env_step": 745000, "rew": 5545.2522, "rew_std": 556.2845, "Agent": "SAC"}, {"env_step": 750000, "rew": 5725.0663, "rew_std": 311.8731, "Agent": "SAC"}, {"env_step": 755000, "rew": 5690.6184, "rew_std": 351.7627, "Agent": "SAC"}, {"env_step": 760000, "rew": 5567.3753, "rew_std": 482.2716, "Agent": "SAC"}, {"env_step": 765000, "rew": 5510.4696, "rew_std": 385.251, "Agent": "SAC"}, {"env_step": 770000, "rew": 5270.3259, "rew_std": 987.3123, "Agent": "SAC"}, {"env_step": 775000, "rew": 5467.4195, "rew_std": 853.2007, "Agent": "SAC"}, {"env_step": 780000, "rew": 5287.154, "rew_std": 1035.4332, "Agent": "SAC"}, {"env_step": 785000, "rew": 5691.6446, "rew_std": 516.7474, "Agent": "SAC"}, {"env_step": 790000, "rew": 5591.892, "rew_std": 295.6546, "Agent": "SAC"}, {"env_step": 795000, "rew": 5488.8903, "rew_std": 424.9128, "Agent": "SAC"}, {"env_step": 800000, "rew": 5459.0244, "rew_std": 826.6396, "Agent": "SAC"}, {"env_step": 805000, "rew": 5664.4516, "rew_std": 397.5254, "Agent": "SAC"}, {"env_step": 810000, "rew": 5543.2376, "rew_std": 562.8029, "Agent": "SAC"}, {"env_step": 815000, "rew": 5693.9674, "rew_std": 408.3632, "Agent": "SAC"}, {"env_step": 820000, "rew": 5680.3464, "rew_std": 307.6037, "Agent": "SAC"}, {"env_step": 825000, "rew": 5709.4142, "rew_std": 227.2665, "Agent": "SAC"}, {"env_step": 830000, "rew": 5555.0137, "rew_std": 505.6524, "Agent": "SAC"}, {"env_step": 835000, "rew": 5673.183, "rew_std": 379.6022, "Agent": "SAC"}, {"env_step": 840000, "rew": 5107.2045, "rew_std": 1424.1345, "Agent": "SAC"}, {"env_step": 845000, "rew": 5517.1734, "rew_std": 693.1669, "Agent": "SAC"}, {"env_step": 850000, "rew": 5629.4855, "rew_std": 347.9435, "Agent": "SAC"}, {"env_step": 855000, "rew": 5564.5545, "rew_std": 534.6357, "Agent": "SAC"}, {"env_step": 860000, "rew": 5395.1586, "rew_std": 782.8633, "Agent": "SAC"}, {"env_step": 865000, "rew": 5656.6156, "rew_std": 360.7084, "Agent": "SAC"}, {"env_step": 870000, "rew": 5845.8685, "rew_std": 260.3917, "Agent": "SAC"}, {"env_step": 875000, "rew": 5446.3008, "rew_std": 735.6111, "Agent": "SAC"}, {"env_step": 880000, "rew": 5640.0635, "rew_std": 470.5824, "Agent": "SAC"}, {"env_step": 885000, "rew": 5732.5999, "rew_std": 502.8969, "Agent": "SAC"}, {"env_step": 890000, "rew": 5555.4769, "rew_std": 465.2802, "Agent": "SAC"}, {"env_step": 895000, "rew": 5651.3705, "rew_std": 230.4769, "Agent": "SAC"}, {"env_step": 900000, "rew": 5702.166, "rew_std": 372.4946, "Agent": "SAC"}, {"env_step": 905000, "rew": 5720.2143, "rew_std": 355.2288, "Agent": "SAC"}, {"env_step": 910000, "rew": 5585.9028, "rew_std": 563.3985, "Agent": "SAC"}, {"env_step": 915000, "rew": 5672.2431, "rew_std": 522.0986, "Agent": "SAC"}, {"env_step": 920000, "rew": 5778.5705, "rew_std": 412.6784, "Agent": "SAC"}, {"env_step": 925000, "rew": 5810.2684, "rew_std": 324.2981, "Agent": "SAC"}, {"env_step": 930000, "rew": 5125.3163, "rew_std": 1923.0686, "Agent": "SAC"}, {"env_step": 935000, "rew": 4851.2896, "rew_std": 2254.6923, "Agent": "SAC"}, {"env_step": 940000, "rew": 5244.8474, "rew_std": 1666.2577, "Agent": "SAC"}, {"env_step": 945000, "rew": 5303.0647, "rew_std": 1354.3917, "Agent": "SAC"}, {"env_step": 950000, "rew": 5653.4382, "rew_std": 624.9922, "Agent": "SAC"}, {"env_step": 955000, "rew": 5778.0612, "rew_std": 426.7755, "Agent": "SAC"}, {"env_step": 960000, "rew": 5670.2887, "rew_std": 693.5821, "Agent": "SAC"}, {"env_step": 965000, "rew": 5044.8635, "rew_std": 1861.1285, "Agent": "SAC"}, {"env_step": 970000, "rew": 4849.5535, "rew_std": 2068.7704, "Agent": "SAC"}, {"env_step": 975000, "rew": 5113.4048, "rew_std": 1735.4742, "Agent": "SAC"}, {"env_step": 980000, "rew": 5188.3984, "rew_std": 1727.6241, "Agent": "SAC"}, {"env_step": 985000, "rew": 5850.2488, "rew_std": 475.6532, "Agent": "SAC"}, {"env_step": 990000, "rew": 5813.4523, "rew_std": 264.809, "Agent": "SAC"}, {"env_step": 995000, "rew": 5742.2444, "rew_std": 418.5699, "Agent": "SAC"}, {"env_step": 1000000, "rew": 5714.2661, "rew_std": 368.5243, "Agent": "SAC"}, {"env_step": 1005000, "rew": 5413.1424, "rew_std": 797.9577, "Agent": "SAC"}, {"env_step": 1010000, "rew": 5183.4618, "rew_std": 2031.9834, "Agent": "SAC"}, {"env_step": 1015000, "rew": 5119.8702, "rew_std": 1840.3876, "Agent": "SAC"}, {"env_step": 1020000, "rew": 5168.524, "rew_std": 1586.408, "Agent": "SAC"}, {"env_step": 1025000, "rew": 5733.1041, "rew_std": 317.4068, "Agent": "SAC"}, {"env_step": 1030000, "rew": 5642.594, "rew_std": 248.2455, "Agent": "SAC"}, {"env_step": 1035000, "rew": 5850.1509, "rew_std": 411.4642, "Agent": "SAC"}, {"env_step": 1040000, "rew": 5974.4491, "rew_std": 269.7785, "Agent": "SAC"}, {"env_step": 1045000, "rew": 5031.7685, "rew_std": 2330.7907, "Agent": "SAC"}, {"env_step": 1050000, "rew": 5236.7993, "rew_std": 1973.0137, "Agent": "SAC"}, {"env_step": 1055000, "rew": 5021.8125, "rew_std": 2004.5906, "Agent": "SAC"}, {"env_step": 1060000, "rew": 5165.6284, "rew_std": 2382.8055, "Agent": "SAC"}, {"env_step": 1065000, "rew": 5158.7046, "rew_std": 1851.172, "Agent": "SAC"}, {"env_step": 1070000, "rew": 5138.9775, "rew_std": 2083.5424, "Agent": "SAC"}, {"env_step": 1075000, "rew": 5019.4091, "rew_std": 2127.5281, "Agent": "SAC"}, {"env_step": 1080000, "rew": 5292.9344, "rew_std": 2149.235, "Agent": "SAC"}, {"env_step": 1085000, "rew": 5154.5682, "rew_std": 1838.3159, "Agent": "SAC"}, {"env_step": 1090000, "rew": 5282.5727, "rew_std": 1822.7381, "Agent": "SAC"}, {"env_step": 1095000, "rew": 4668.0528, "rew_std": 2605.2238, "Agent": "SAC"}, {"env_step": 1100000, "rew": 4801.5646, "rew_std": 2266.8663, "Agent": "SAC"}, {"env_step": 1105000, "rew": 4975.1772, "rew_std": 2411.4807, "Agent": "SAC"}, {"env_step": 1110000, "rew": 5378.207, "rew_std": 1623.0413, "Agent": "SAC"}, {"env_step": 1115000, "rew": 5516.254, "rew_std": 841.5805, "Agent": "SAC"}, {"env_step": 1120000, "rew": 5419.4915, "rew_std": 888.8777, "Agent": "SAC"}, {"env_step": 1125000, "rew": 5582.7173, "rew_std": 1128.1217, "Agent": "SAC"}, {"env_step": 1130000, "rew": 5497.8511, "rew_std": 1006.239, "Agent": "SAC"}, {"env_step": 1135000, "rew": 5839.487, "rew_std": 431.9108, "Agent": "SAC"}, {"env_step": 1140000, "rew": 5961.432, "rew_std": 378.7637, "Agent": "SAC"}, {"env_step": 1145000, "rew": 5857.0817, "rew_std": 374.6548, "Agent": "SAC"}, {"env_step": 1150000, "rew": 5925.9246, "rew_std": 342.4812, "Agent": "SAC"}, {"env_step": 1155000, "rew": 5907.3666, "rew_std": 498.7652, "Agent": "SAC"}, {"env_step": 1160000, "rew": 6098.61, "rew_std": 263.329, "Agent": "SAC"}, {"env_step": 1165000, "rew": 5864.8649, "rew_std": 387.2574, "Agent": "SAC"}, {"env_step": 1170000, "rew": 5890.1991, "rew_std": 508.4673, "Agent": "SAC"}, {"env_step": 1175000, "rew": 5840.934, "rew_std": 384.9363, "Agent": "SAC"}, {"env_step": 1180000, "rew": 5641.1752, "rew_std": 507.7719, "Agent": "SAC"}, {"env_step": 1185000, "rew": 5885.6678, "rew_std": 434.8161, "Agent": "SAC"}, {"env_step": 1190000, "rew": 5746.5579, "rew_std": 341.3485, "Agent": "SAC"}, {"env_step": 1195000, "rew": 5856.6325, "rew_std": 438.0519, "Agent": "SAC"}, {"env_step": 1200000, "rew": 5912.71, "rew_std": 225.9145, "Agent": "SAC"}, {"env_step": 1205000, "rew": 6033.2897, "rew_std": 362.7604, "Agent": "SAC"}, {"env_step": 1210000, "rew": 5916.6141, "rew_std": 264.2832, "Agent": "SAC"}, {"env_step": 1215000, "rew": 6096.7137, "rew_std": 276.9315, "Agent": "SAC"}, {"env_step": 1220000, "rew": 6058.312, "rew_std": 220.9652, "Agent": "SAC"}, {"env_step": 1225000, "rew": 6058.1806, "rew_std": 321.2416, "Agent": "SAC"}, {"env_step": 1230000, "rew": 5876.7533, "rew_std": 364.0235, "Agent": "SAC"}, {"env_step": 1235000, "rew": 6052.7966, "rew_std": 334.4648, "Agent": "SAC"}, {"env_step": 1240000, "rew": 6014.9591, "rew_std": 470.4387, "Agent": "SAC"}, {"env_step": 1245000, "rew": 5959.6132, "rew_std": 405.2573, "Agent": "SAC"}, {"env_step": 1250000, "rew": 6059.9079, "rew_std": 333.8162, "Agent": "SAC"}, {"env_step": 0, "rew": -46.1947, "rew_std": 25.5804, "Agent": "TRPO"}, {"env_step": 30720, "rew": -13.9012, "rew_std": 11.913, "Agent": "TRPO"}, {"env_step": 61440, "rew": 18.0615, "rew_std": 9.0166, "Agent": "TRPO"}, {"env_step": 92160, "rew": 51.9175, "rew_std": 16.4955, "Agent": "TRPO"}, {"env_step": 122880, "rew": 108.4958, "rew_std": 33.2241, "Agent": "TRPO"}, {"env_step": 153600, "rew": 183.9944, "rew_std": 35.8262, "Agent": "TRPO"}, {"env_step": 184320, "rew": 257.4861, "rew_std": 60.051, "Agent": "TRPO"}, {"env_step": 215040, "rew": 430.4068, "rew_std": 124.2541, "Agent": "TRPO"}, {"env_step": 245760, "rew": 564.2017, "rew_std": 146.0606, "Agent": "TRPO"}, {"env_step": 276480, "rew": 682.5168, "rew_std": 122.3187, "Agent": "TRPO"}, {"env_step": 307200, "rew": 832.5033, "rew_std": 159.2968, "Agent": "TRPO"}, {"env_step": 337920, "rew": 1014.1049, "rew_std": 221.8108, "Agent": "TRPO"}, {"env_step": 368640, "rew": 1128.5618, "rew_std": 167.9213, "Agent": "TRPO"}, {"env_step": 399360, "rew": 1146.4494, "rew_std": 215.1602, "Agent": "TRPO"}, {"env_step": 430080, "rew": 1233.6374, "rew_std": 286.8604, "Agent": "TRPO"}, {"env_step": 460800, "rew": 1261.4876, "rew_std": 301.0892, "Agent": "TRPO"}, {"env_step": 491520, "rew": 1472.6865, "rew_std": 215.7148, "Agent": "TRPO"}, {"env_step": 522240, "rew": 1501.5343, "rew_std": 428.1053, "Agent": "TRPO"}, {"env_step": 552960, "rew": 1631.5161, "rew_std": 558.1692, "Agent": "TRPO"}, {"env_step": 583680, "rew": 1741.6005, "rew_std": 483.7599, "Agent": "TRPO"}, {"env_step": 614400, "rew": 1809.3667, "rew_std": 444.8329, "Agent": "TRPO"}, {"env_step": 645120, "rew": 1943.2351, "rew_std": 386.0455, "Agent": "TRPO"}, {"env_step": 675840, "rew": 2119.3593, "rew_std": 463.9853, "Agent": "TRPO"}, {"env_step": 706560, "rew": 2160.9349, "rew_std": 299.8534, "Agent": "TRPO"}, {"env_step": 737280, "rew": 2205.6584, "rew_std": 495.8226, "Agent": "TRPO"}, {"env_step": 768000, "rew": 2148.4616, "rew_std": 617.4263, "Agent": "TRPO"}, {"env_step": 798720, "rew": 2294.2347, "rew_std": 619.654, "Agent": "TRPO"}, {"env_step": 829440, "rew": 2334.3877, "rew_std": 569.8366, "Agent": "TRPO"}, {"env_step": 860160, "rew": 2373.0195, "rew_std": 635.4872, "Agent": "TRPO"}, {"env_step": 890880, "rew": 2572.1874, "rew_std": 771.2781, "Agent": "TRPO"}, {"env_step": 921600, "rew": 2568.2581, "rew_std": 539.7726, "Agent": "TRPO"}, {"env_step": 952320, "rew": 2639.2867, "rew_std": 572.4301, "Agent": "TRPO"}, {"env_step": 983040, "rew": 2866.6508, "rew_std": 707.8937, "Agent": "TRPO"}, {"env_step": 1013760, "rew": 2731.0697, "rew_std": 675.644, "Agent": "TRPO"}, {"env_step": 1044480, "rew": 2702.1965, "rew_std": 742.4807, "Agent": "TRPO"}, {"env_step": 1075200, "rew": 3001.7621, "rew_std": 688.8314, "Agent": "TRPO"}, {"env_step": 1105920, "rew": 2877.8716, "rew_std": 922.2411, "Agent": "TRPO"}, {"env_step": 1136640, "rew": 3104.9072, "rew_std": 800.8227, "Agent": "TRPO"}, {"env_step": 1167360, "rew": 2976.5528, "rew_std": 661.5153, "Agent": "TRPO"}, {"env_step": 1198080, "rew": 3196.2228, "rew_std": 707.9679, "Agent": "TRPO"}, {"env_step": 1228800, "rew": 3237.2005, "rew_std": 505.6685, "Agent": "TRPO"}, {"env_step": 1259520, "rew": 3098.3083, "rew_std": 578.4346, "Agent": "TRPO"}, {"env_step": 1290240, "rew": 3356.962, "rew_std": 786.3838, "Agent": "TRPO"}, {"env_step": 1320960, "rew": 3241.2647, "rew_std": 600.3495, "Agent": "TRPO"}, {"env_step": 1351680, "rew": 3361.1722, "rew_std": 547.5151, "Agent": "TRPO"}, {"env_step": 1382400, "rew": 3495.3879, "rew_std": 662.5387, "Agent": "TRPO"}, {"env_step": 1413120, "rew": 3388.8443, "rew_std": 537.1016, "Agent": "TRPO"}, {"env_step": 1443840, "rew": 3493.6456, "rew_std": 509.2391, "Agent": "TRPO"}, {"env_step": 1474560, "rew": 3256.3625, "rew_std": 412.1903, "Agent": "TRPO"}, {"env_step": 1505280, "rew": 3695.3862, "rew_std": 644.5284, "Agent": "TRPO"}, {"env_step": 1536000, "rew": 3685.0253, "rew_std": 537.4812, "Agent": "TRPO"}, {"env_step": 1566720, "rew": 3565.3736, "rew_std": 647.2313, "Agent": "TRPO"}, {"env_step": 1597440, "rew": 3790.5153, "rew_std": 702.1943, "Agent": "TRPO"}, {"env_step": 1628160, "rew": 3598.3267, "rew_std": 626.2541, "Agent": "TRPO"}, {"env_step": 1658880, "rew": 3970.7287, "rew_std": 647.9836, "Agent": "TRPO"}, {"env_step": 1689600, "rew": 3658.6492, "rew_std": 645.0697, "Agent": "TRPO"}, {"env_step": 1720320, "rew": 3848.0345, "rew_std": 701.1273, "Agent": "TRPO"}, {"env_step": 1751040, "rew": 4061.4513, "rew_std": 690.0289, "Agent": "TRPO"}, {"env_step": 1781760, "rew": 3807.921, "rew_std": 706.5999, "Agent": "TRPO"}, {"env_step": 1812480, "rew": 3802.0342, "rew_std": 663.7139, "Agent": "TRPO"}, {"env_step": 1843200, "rew": 3873.6662, "rew_std": 566.3833, "Agent": "TRPO"}, {"env_step": 1873920, "rew": 4038.6082, "rew_std": 518.5079, "Agent": "TRPO"}, {"env_step": 1904640, "rew": 4167.3221, "rew_std": 440.9658, "Agent": "TRPO"}, {"env_step": 1935360, "rew": 3922.2855, "rew_std": 733.8238, "Agent": "TRPO"}, {"env_step": 1966080, "rew": 4174.7307, "rew_std": 495.1849, "Agent": "TRPO"}, {"env_step": 1996800, "rew": 4155.8384, "rew_std": 477.6376, "Agent": "TRPO"}, {"env_step": 2027520, "rew": 4259.3055, "rew_std": 577.3636, "Agent": "TRPO"}, {"env_step": 2058240, "rew": 4256.1933, "rew_std": 594.2826, "Agent": "TRPO"}, {"env_step": 2088960, "rew": 4355.0669, "rew_std": 605.8978, "Agent": "TRPO"}, {"env_step": 2119680, "rew": 4297.2252, "rew_std": 474.421, "Agent": "TRPO"}, {"env_step": 2150400, "rew": 4287.4698, "rew_std": 363.7332, "Agent": "TRPO"}, {"env_step": 2181120, "rew": 4398.2137, "rew_std": 354.3603, "Agent": "TRPO"}, {"env_step": 2211840, "rew": 4413.5796, "rew_std": 460.9681, "Agent": "TRPO"}, {"env_step": 2242560, "rew": 4329.001, "rew_std": 530.2755, "Agent": "TRPO"}, {"env_step": 2273280, "rew": 4252.3464, "rew_std": 597.5882, "Agent": "TRPO"}, {"env_step": 2304000, "rew": 4462.5657, "rew_std": 495.3802, "Agent": "TRPO"}, {"env_step": 2334720, "rew": 4374.2838, "rew_std": 457.0956, "Agent": "TRPO"}, {"env_step": 2365440, "rew": 4529.4549, "rew_std": 461.1733, "Agent": "TRPO"}, {"env_step": 2396160, "rew": 4291.4468, "rew_std": 411.2142, "Agent": "TRPO"}, {"env_step": 2426880, "rew": 4430.1459, "rew_std": 601.8812, "Agent": "TRPO"}, {"env_step": 2457600, "rew": 4508.078, "rew_std": 465.0507, "Agent": "TRPO"}, {"env_step": 2488320, "rew": 4151.3796, "rew_std": 414.656, "Agent": "TRPO"}, {"env_step": 2519040, "rew": 4705.7212, "rew_std": 477.1206, "Agent": "TRPO"}, {"env_step": 2549760, "rew": 4641.3111, "rew_std": 622.6369, "Agent": "TRPO"}, {"env_step": 2580480, "rew": 4484.1452, "rew_std": 442.0811, "Agent": "TRPO"}, {"env_step": 2611200, "rew": 4658.7294, "rew_std": 432.1496, "Agent": "TRPO"}, {"env_step": 2641920, "rew": 4625.8785, "rew_std": 357.4208, "Agent": "TRPO"}, {"env_step": 2672640, "rew": 4284.9794, "rew_std": 599.7262, "Agent": "TRPO"}, {"env_step": 2703360, "rew": 4419.1972, "rew_std": 447.5325, "Agent": "TRPO"}, {"env_step": 2734080, "rew": 4746.1067, "rew_std": 580.4515, "Agent": "TRPO"}, {"env_step": 2764800, "rew": 4756.6644, "rew_std": 502.4658, "Agent": "TRPO"}, {"env_step": 2795520, "rew": 4607.7287, "rew_std": 427.1984, "Agent": "TRPO"}, {"env_step": 2826240, "rew": 4404.4363, "rew_std": 555.3297, "Agent": "TRPO"}, {"env_step": 2856960, "rew": 4816.8623, "rew_std": 528.6794, "Agent": "TRPO"}, {"env_step": 2887680, "rew": 4753.3578, "rew_std": 715.7057, "Agent": "TRPO"}, {"env_step": 2918400, "rew": 4604.763, "rew_std": 447.4458, "Agent": "TRPO"}, {"env_step": 2949120, "rew": 4800.2693, "rew_std": 602.9667, "Agent": "TRPO"}, {"env_step": 2979840, "rew": 4772.9396, "rew_std": 368.1691, "Agent": "TRPO"}, {"env_step": 3010560, "rew": 4897.0257, "rew_std": 449.1329, "Agent": "TRPO"}, {"env_step": 3041280, "rew": 4841.7814, "rew_std": 534.8951, "Agent": "TRPO"}, {"env_step": 3072000, "rew": 4604.9043, "rew_std": 580.976, "Agent": "TRPO"}, {"env_step": 0, "rew": -51.4935, "rew_std": 27.5503, "Agent": "A2C"}, {"env_step": 30000, "rew": -29.8644, "rew_std": 10.21, "Agent": "A2C"}, {"env_step": 60000, "rew": 8.1853, "rew_std": 18.2229, "Agent": "A2C"}, {"env_step": 90000, "rew": 72.4685, "rew_std": 23.1961, "Agent": "A2C"}, {"env_step": 120000, "rew": 166.4676, "rew_std": 47.3271, "Agent": "A2C"}, {"env_step": 150000, "rew": 295.9591, "rew_std": 53.7155, "Agent": "A2C"}, {"env_step": 180000, "rew": 433.0201, "rew_std": 61.09, "Agent": "A2C"}, {"env_step": 210000, "rew": 586.3078, "rew_std": 67.2288, "Agent": "A2C"}, {"env_step": 240000, "rew": 756.9108, "rew_std": 94.0155, "Agent": "A2C"}, {"env_step": 270000, "rew": 805.3976, "rew_std": 247.5444, "Agent": "A2C"}, {"env_step": 300000, "rew": 1061.0577, "rew_std": 248.3772, "Agent": "A2C"}, {"env_step": 330000, "rew": 1097.009, "rew_std": 287.8099, "Agent": "A2C"}, {"env_step": 360000, "rew": 1361.5714, "rew_std": 207.5136, "Agent": "A2C"}, {"env_step": 390000, "rew": 1461.0194, "rew_std": 208.5063, "Agent": "A2C"}, {"env_step": 420000, "rew": 1664.8355, "rew_std": 330.0613, "Agent": "A2C"}, {"env_step": 450000, "rew": 2027.2921, "rew_std": 406.546, "Agent": "A2C"}, {"env_step": 480000, "rew": 2167.3209, "rew_std": 296.5709, "Agent": "A2C"}, {"env_step": 510000, "rew": 2056.6103, "rew_std": 433.0343, "Agent": "A2C"}, {"env_step": 540000, "rew": 2277.6117, "rew_std": 415.327, "Agent": "A2C"}, {"env_step": 570000, "rew": 2426.6807, "rew_std": 406.55, "Agent": "A2C"}, {"env_step": 600000, "rew": 2246.863, "rew_std": 394.1466, "Agent": "A2C"}, {"env_step": 630000, "rew": 2542.0354, "rew_std": 308.5228, "Agent": "A2C"}, {"env_step": 660000, "rew": 2831.0715, "rew_std": 421.904, "Agent": "A2C"}, {"env_step": 690000, "rew": 2505.3813, "rew_std": 541.7428, "Agent": "A2C"}, {"env_step": 720000, "rew": 2858.1248, "rew_std": 808.4451, "Agent": "A2C"}, {"env_step": 750000, "rew": 2779.9051, "rew_std": 499.6664, "Agent": "A2C"}, {"env_step": 780000, "rew": 3057.9012, "rew_std": 438.8949, "Agent": "A2C"}, {"env_step": 810000, "rew": 2922.3404, "rew_std": 487.1237, "Agent": "A2C"}, {"env_step": 840000, "rew": 3062.2575, "rew_std": 570.3453, "Agent": "A2C"}, {"env_step": 870000, "rew": 3098.2249, "rew_std": 598.1617, "Agent": "A2C"}, {"env_step": 900000, "rew": 3468.0156, "rew_std": 356.8802, "Agent": "A2C"}, {"env_step": 930000, "rew": 3332.6813, "rew_std": 455.3087, "Agent": "A2C"}, {"env_step": 960000, "rew": 3485.3726, "rew_std": 433.075, "Agent": "A2C"}, {"env_step": 990000, "rew": 3532.2745, "rew_std": 355.396, "Agent": "A2C"}, {"env_step": 1020000, "rew": 3371.1942, "rew_std": 756.4559, "Agent": "A2C"}, {"env_step": 1050000, "rew": 3327.8508, "rew_std": 465.0158, "Agent": "A2C"}, {"env_step": 1080000, "rew": 3410.0672, "rew_std": 487.9373, "Agent": "A2C"}, {"env_step": 1110000, "rew": 3508.0405, "rew_std": 492.2738, "Agent": "A2C"}, {"env_step": 1140000, "rew": 3645.9659, "rew_std": 234.3579, "Agent": "A2C"}, {"env_step": 1170000, "rew": 3601.9476, "rew_std": 410.754, "Agent": "A2C"}, {"env_step": 1200000, "rew": 3697.1497, "rew_std": 336.5131, "Agent": "A2C"}, {"env_step": 1230000, "rew": 3600.163, "rew_std": 755.6142, "Agent": "A2C"}, {"env_step": 1260000, "rew": 3783.988, "rew_std": 365.581, "Agent": "A2C"}, {"env_step": 1290000, "rew": 3999.3058, "rew_std": 357.098, "Agent": "A2C"}, {"env_step": 1320000, "rew": 3882.6923, "rew_std": 427.2421, "Agent": "A2C"}, {"env_step": 1350000, "rew": 4203.9126, "rew_std": 322.069, "Agent": "A2C"}, {"env_step": 1380000, "rew": 4071.4676, "rew_std": 298.9797, "Agent": "A2C"}, {"env_step": 1410000, "rew": 3725.2422, "rew_std": 638.7074, "Agent": "A2C"}, {"env_step": 1440000, "rew": 3869.6779, "rew_std": 614.8018, "Agent": "A2C"}, {"env_step": 1470000, "rew": 3937.0898, "rew_std": 566.8286, "Agent": "A2C"}, {"env_step": 1500000, "rew": 4054.1049, "rew_std": 565.2622, "Agent": "A2C"}, {"env_step": 1530000, "rew": 4147.8125, "rew_std": 536.8616, "Agent": "A2C"}, {"env_step": 1560000, "rew": 4044.8505, "rew_std": 322.5931, "Agent": "A2C"}, {"env_step": 1590000, "rew": 4189.3446, "rew_std": 273.6783, "Agent": "A2C"}, {"env_step": 1620000, "rew": 4134.2459, "rew_std": 478.0475, "Agent": "A2C"}, {"env_step": 1650000, "rew": 4109.2237, "rew_std": 576.0219, "Agent": "A2C"}, {"env_step": 1680000, "rew": 4373.6784, "rew_std": 203.6434, "Agent": "A2C"}, {"env_step": 1710000, "rew": 4463.585, "rew_std": 379.672, "Agent": "A2C"}, {"env_step": 1740000, "rew": 4189.2454, "rew_std": 566.2247, "Agent": "A2C"}, {"env_step": 1770000, "rew": 4368.2683, "rew_std": 505.7004, "Agent": "A2C"}, {"env_step": 1800000, "rew": 4242.8701, "rew_std": 714.7195, "Agent": "A2C"}, {"env_step": 1830000, "rew": 4408.0621, "rew_std": 300.5416, "Agent": "A2C"}, {"env_step": 1860000, "rew": 4574.196, "rew_std": 279.109, "Agent": "A2C"}, {"env_step": 1890000, "rew": 4396.9066, "rew_std": 490.7734, "Agent": "A2C"}, {"env_step": 1920000, "rew": 4523.7742, "rew_std": 397.95, "Agent": "A2C"}, {"env_step": 1950000, "rew": 4554.3086, "rew_std": 592.726, "Agent": "A2C"}, {"env_step": 1980000, "rew": 4305.6687, "rew_std": 562.9579, "Agent": "A2C"}, {"env_step": 2010000, "rew": 4894.4541, "rew_std": 219.3345, "Agent": "A2C"}, {"env_step": 2040000, "rew": 4487.1695, "rew_std": 301.3349, "Agent": "A2C"}, {"env_step": 2070000, "rew": 4466.5832, "rew_std": 464.2145, "Agent": "A2C"}, {"env_step": 2100000, "rew": 4666.3744, "rew_std": 370.7685, "Agent": "A2C"}, {"env_step": 2130000, "rew": 4706.4277, "rew_std": 403.2524, "Agent": "A2C"}, {"env_step": 2160000, "rew": 4530.5346, "rew_std": 514.5, "Agent": "A2C"}, {"env_step": 2190000, "rew": 4873.5241, "rew_std": 324.0447, "Agent": "A2C"}, {"env_step": 2220000, "rew": 4810.5365, "rew_std": 344.5598, "Agent": "A2C"}, {"env_step": 2250000, "rew": 4721.3229, "rew_std": 238.1361, "Agent": "A2C"}, {"env_step": 2280000, "rew": 4736.7355, "rew_std": 413.251, "Agent": "A2C"}, {"env_step": 2310000, "rew": 4755.9058, "rew_std": 473.5718, "Agent": "A2C"}, {"env_step": 2340000, "rew": 4974.8084, "rew_std": 217.7102, "Agent": "A2C"}, {"env_step": 2370000, "rew": 5030.6218, "rew_std": 207.6396, "Agent": "A2C"}, {"env_step": 2400000, "rew": 4690.2767, "rew_std": 409.2839, "Agent": "A2C"}, {"env_step": 2430000, "rew": 5039.456, "rew_std": 318.2659, "Agent": "A2C"}, {"env_step": 2460000, "rew": 4773.1173, "rew_std": 416.1896, "Agent": "A2C"}, {"env_step": 2490000, "rew": 4789.5868, "rew_std": 502.159, "Agent": "A2C"}, {"env_step": 2520000, "rew": 4823.6652, "rew_std": 396.6441, "Agent": "A2C"}, {"env_step": 2550000, "rew": 4879.6176, "rew_std": 429.7661, "Agent": "A2C"}, {"env_step": 2580000, "rew": 4993.1127, "rew_std": 328.2962, "Agent": "A2C"}, {"env_step": 2610000, "rew": 4898.4844, "rew_std": 489.4285, "Agent": "A2C"}, {"env_step": 2640000, "rew": 5096.5163, "rew_std": 294.0463, "Agent": "A2C"}, {"env_step": 2670000, "rew": 4900.6782, "rew_std": 323.0878, "Agent": "A2C"}, {"env_step": 2700000, "rew": 5009.7045, "rew_std": 226.3388, "Agent": "A2C"}, {"env_step": 2730000, "rew": 4908.1905, "rew_std": 478.5281, "Agent": "A2C"}, {"env_step": 2760000, "rew": 4939.0956, "rew_std": 377.716, "Agent": "A2C"}, {"env_step": 2790000, "rew": 5165.0076, "rew_std": 268.143, "Agent": "A2C"}, {"env_step": 2820000, "rew": 5035.1886, "rew_std": 405.329, "Agent": "A2C"}, {"env_step": 2850000, "rew": 5094.7334, "rew_std": 427.7514, "Agent": "A2C"}, {"env_step": 2880000, "rew": 4926.0901, "rew_std": 387.6091, "Agent": "A2C"}, {"env_step": 2910000, "rew": 5062.6458, "rew_std": 495.6891, "Agent": "A2C"}, {"env_step": 2940000, "rew": 5111.7299, "rew_std": 400.9655, "Agent": "A2C"}, {"env_step": 2970000, "rew": 5236.7584, "rew_std": 236.6818, "Agent": "A2C"}, {"env_step": 3000000, "rew": 5064.3433, "rew_std": 284.9814, "Agent": "A2C"}, {"env_step": 0, "rew": -51.1159, "rew_std": 22.2925, "Agent": "ACKTR"}, {"env_step": 30000, "rew": -55.1733, "rew_std": 20.7228, "Agent": "ACKTR"}, {"env_step": 60000, "rew": -29.8844, "rew_std": 24.9148, "Agent": "ACKTR"}, {"env_step": 90000, "rew": -17.8622, "rew_std": 15.4919, "Agent": "ACKTR"}, {"env_step": 120000, "rew": 2.7944, "rew_std": 12.5161, "Agent": "ACKTR"}, {"env_step": 150000, "rew": 17.5914, "rew_std": 16.5646, "Agent": "ACKTR"}, {"env_step": 180000, "rew": 50.012, "rew_std": 28.5837, "Agent": "ACKTR"}, {"env_step": 210000, "rew": 60.5538, "rew_std": 17.2586, "Agent": "ACKTR"}, {"env_step": 240000, "rew": 113.237, "rew_std": 45.2853, "Agent": "ACKTR"}, {"env_step": 270000, "rew": 165.6851, "rew_std": 51.042, "Agent": "ACKTR"}, {"env_step": 300000, "rew": 209.2715, "rew_std": 61.4836, "Agent": "ACKTR"}, {"env_step": 330000, "rew": 251.8624, "rew_std": 89.1594, "Agent": "ACKTR"}, {"env_step": 360000, "rew": 335.1485, "rew_std": 86.1314, "Agent": "ACKTR"}, {"env_step": 390000, "rew": 372.0135, "rew_std": 84.6685, "Agent": "ACKTR"}, {"env_step": 420000, "rew": 454.8912, "rew_std": 107.7605, "Agent": "ACKTR"}, {"env_step": 450000, "rew": 502.1926, "rew_std": 96.7837, "Agent": "ACKTR"}, {"env_step": 480000, "rew": 508.3361, "rew_std": 67.995, "Agent": "ACKTR"}, {"env_step": 510000, "rew": 542.7329, "rew_std": 122.4863, "Agent": "ACKTR"}, {"env_step": 540000, "rew": 619.618, "rew_std": 127.1325, "Agent": "ACKTR"}, {"env_step": 570000, "rew": 622.386, "rew_std": 87.0652, "Agent": "ACKTR"}, {"env_step": 600000, "rew": 643.2475, "rew_std": 118.3534, "Agent": "ACKTR"}, {"env_step": 630000, "rew": 711.5836, "rew_std": 115.2815, "Agent": "ACKTR"}, {"env_step": 660000, "rew": 726.6018, "rew_std": 132.7868, "Agent": "ACKTR"}, {"env_step": 690000, "rew": 700.3915, "rew_std": 136.5581, "Agent": "ACKTR"}, {"env_step": 720000, "rew": 846.5125, "rew_std": 221.4335, "Agent": "ACKTR"}, {"env_step": 750000, "rew": 897.5913, "rew_std": 217.1571, "Agent": "ACKTR"}, {"env_step": 780000, "rew": 997.8158, "rew_std": 209.6639, "Agent": "ACKTR"}, {"env_step": 810000, "rew": 1008.6334, "rew_std": 188.3656, "Agent": "ACKTR"}, {"env_step": 840000, "rew": 1039.4789, "rew_std": 194.9829, "Agent": "ACKTR"}, {"env_step": 870000, "rew": 1127.0584, "rew_std": 277.8994, "Agent": "ACKTR"}, {"env_step": 900000, "rew": 1033.4706, "rew_std": 222.9172, "Agent": "ACKTR"}, {"env_step": 930000, "rew": 1151.4823, "rew_std": 173.3884, "Agent": "ACKTR"}, {"env_step": 960000, "rew": 1368.184, "rew_std": 272.4198, "Agent": "ACKTR"}, {"env_step": 990000, "rew": 1366.1295, "rew_std": 247.5901, "Agent": "ACKTR"}, {"env_step": 1020000, "rew": 1308.2419, "rew_std": 506.5229, "Agent": "ACKTR"}, {"env_step": 1050000, "rew": 1363.1904, "rew_std": 513.6879, "Agent": "ACKTR"}, {"env_step": 1080000, "rew": 1386.6625, "rew_std": 425.1895, "Agent": "ACKTR"}, {"env_step": 1110000, "rew": 1656.4518, "rew_std": 448.8382, "Agent": "ACKTR"}, {"env_step": 1140000, "rew": 1377.252, "rew_std": 406.0232, "Agent": "ACKTR"}, {"env_step": 1170000, "rew": 1834.7485, "rew_std": 531.4445, "Agent": "ACKTR"}, {"env_step": 1200000, "rew": 2003.9069, "rew_std": 552.9861, "Agent": "ACKTR"}, {"env_step": 1230000, "rew": 1971.8287, "rew_std": 605.6529, "Agent": "ACKTR"}, {"env_step": 1260000, "rew": 1873.144, "rew_std": 645.0478, "Agent": "ACKTR"}, {"env_step": 1290000, "rew": 2033.1415, "rew_std": 791.0491, "Agent": "ACKTR"}, {"env_step": 1320000, "rew": 2018.2048, "rew_std": 614.233, "Agent": "ACKTR"}, {"env_step": 1350000, "rew": 2036.331, "rew_std": 600.9722, "Agent": "ACKTR"}, {"env_step": 1380000, "rew": 1982.4575, "rew_std": 537.2168, "Agent": "ACKTR"}, {"env_step": 1410000, "rew": 2008.5591, "rew_std": 943.9488, "Agent": "ACKTR"}, {"env_step": 1440000, "rew": 2167.1065, "rew_std": 613.2319, "Agent": "ACKTR"}, {"env_step": 1470000, "rew": 2003.5611, "rew_std": 521.1535, "Agent": "ACKTR"}, {"env_step": 1500000, "rew": 2343.0121, "rew_std": 854.0222, "Agent": "ACKTR"}, {"env_step": 1530000, "rew": 2301.379, "rew_std": 679.1948, "Agent": "ACKTR"}, {"env_step": 1560000, "rew": 2248.8094, "rew_std": 747.5392, "Agent": "ACKTR"}, {"env_step": 1590000, "rew": 2274.8919, "rew_std": 581.671, "Agent": "ACKTR"}, {"env_step": 1620000, "rew": 2520.9423, "rew_std": 702.1277, "Agent": "ACKTR"}, {"env_step": 1650000, "rew": 2394.4035, "rew_std": 684.8675, "Agent": "ACKTR"}, {"env_step": 1680000, "rew": 2807.4318, "rew_std": 921.0878, "Agent": "ACKTR"}, {"env_step": 1710000, "rew": 2496.0115, "rew_std": 543.7313, "Agent": "ACKTR"}, {"env_step": 1740000, "rew": 2400.4852, "rew_std": 581.3117, "Agent": "ACKTR"}, {"env_step": 1770000, "rew": 2727.1568, "rew_std": 678.8937, "Agent": "ACKTR"}, {"env_step": 1800000, "rew": 2549.6539, "rew_std": 545.8151, "Agent": "ACKTR"}, {"env_step": 1830000, "rew": 2587.8716, "rew_std": 588.693, "Agent": "ACKTR"}, {"env_step": 1860000, "rew": 2549.5426, "rew_std": 462.1076, "Agent": "ACKTR"}, {"env_step": 1890000, "rew": 2946.9396, "rew_std": 659.176, "Agent": "ACKTR"}, {"env_step": 1920000, "rew": 2965.8238, "rew_std": 849.7264, "Agent": "ACKTR"}, {"env_step": 1950000, "rew": 2992.4915, "rew_std": 610.0303, "Agent": "ACKTR"}, {"env_step": 1980000, "rew": 2905.0368, "rew_std": 573.7697, "Agent": "ACKTR"}, {"env_step": 2010000, "rew": 2681.4138, "rew_std": 462.5838, "Agent": "ACKTR"}, {"env_step": 2040000, "rew": 3018.0111, "rew_std": 751.8595, "Agent": "ACKTR"}, {"env_step": 2070000, "rew": 2931.385, "rew_std": 671.6752, "Agent": "ACKTR"}, {"env_step": 2100000, "rew": 3275.6425, "rew_std": 626.7001, "Agent": "ACKTR"}, {"env_step": 2130000, "rew": 3376.6405, "rew_std": 718.642, "Agent": "ACKTR"}, {"env_step": 2160000, "rew": 3264.1332, "rew_std": 711.1494, "Agent": "ACKTR"}, {"env_step": 2190000, "rew": 3286.5841, "rew_std": 683.5056, "Agent": "ACKTR"}, {"env_step": 2220000, "rew": 3125.924, "rew_std": 848.001, "Agent": "ACKTR"}, {"env_step": 2250000, "rew": 3171.802, "rew_std": 576.0974, "Agent": "ACKTR"}, {"env_step": 2280000, "rew": 3300.7179, "rew_std": 599.8094, "Agent": "ACKTR"}, {"env_step": 2310000, "rew": 3230.7315, "rew_std": 751.0966, "Agent": "ACKTR"}, {"env_step": 2340000, "rew": 3225.3237, "rew_std": 654.915, "Agent": "ACKTR"}, {"env_step": 2370000, "rew": 3339.8517, "rew_std": 702.8875, "Agent": "ACKTR"}, {"env_step": 2400000, "rew": 3474.9053, "rew_std": 711.4999, "Agent": "ACKTR"}, {"env_step": 2430000, "rew": 3598.8509, "rew_std": 658.1381, "Agent": "ACKTR"}, {"env_step": 2460000, "rew": 3631.9426, "rew_std": 744.2699, "Agent": "ACKTR"}, {"env_step": 2490000, "rew": 3700.43, "rew_std": 707.7157, "Agent": "ACKTR"}, {"env_step": 2520000, "rew": 3650.0648, "rew_std": 738.0914, "Agent": "ACKTR"}, {"env_step": 2550000, "rew": 3644.216, "rew_std": 674.1804, "Agent": "ACKTR"}, {"env_step": 2580000, "rew": 3485.5256, "rew_std": 718.9007, "Agent": "ACKTR"}, {"env_step": 2610000, "rew": 3428.4171, "rew_std": 540.3576, "Agent": "ACKTR"}, {"env_step": 2640000, "rew": 3772.7819, "rew_std": 538.3571, "Agent": "ACKTR"}, {"env_step": 2670000, "rew": 3929.4809, "rew_std": 687.1127, "Agent": "ACKTR"}, {"env_step": 2700000, "rew": 3559.1185, "rew_std": 678.0846, "Agent": "ACKTR"}, {"env_step": 2730000, "rew": 3468.7167, "rew_std": 558.8028, "Agent": "ACKTR"}, {"env_step": 2760000, "rew": 3600.9884, "rew_std": 765.1541, "Agent": "ACKTR"}, {"env_step": 2790000, "rew": 3711.564, "rew_std": 706.9286, "Agent": "ACKTR"}, {"env_step": 2820000, "rew": 3735.4943, "rew_std": 850.731, "Agent": "ACKTR"}, {"env_step": 2850000, "rew": 3804.8742, "rew_std": 1012.9631, "Agent": "ACKTR"}, {"env_step": 2880000, "rew": 3507.3954, "rew_std": 909.7035, "Agent": "ACKTR"}, {"env_step": 2910000, "rew": 3435.6452, "rew_std": 636.2781, "Agent": "ACKTR"}, {"env_step": 2940000, "rew": 3945.7842, "rew_std": 965.3295, "Agent": "ACKTR"}, {"env_step": 2970000, "rew": 3645.5525, "rew_std": 797.9247, "Agent": "ACKTR"}, {"env_step": 3000000, "rew": 3835.3951, "rew_std": 1122.2309, "Agent": "ACKTR"}, {"env_step": 0, "rew": 990.3775, "rew_std": 4.2988, "Agent": "DDPG"}, {"env_step": 5000, "rew": -264.9603, "rew_std": 150.403, "Agent": "DDPG"}, {"env_step": 10000, "rew": -102.281, "rew_std": 91.1585, "Agent": "DDPG"}, {"env_step": 15000, "rew": -143.1314, "rew_std": 81.0776, "Agent": "DDPG"}, {"env_step": 20000, "rew": -211.1981, "rew_std": 129.6291, "Agent": "DDPG"}, {"env_step": 25000, "rew": -226.9656, "rew_std": 158.8799, "Agent": "DDPG"}, {"env_step": 30000, "rew": -224.9604, "rew_std": 104.4, "Agent": "DDPG"}, {"env_step": 35000, "rew": -372.6741, "rew_std": 211.2733, "Agent": "DDPG"}, {"env_step": 40000, "rew": -275.7362, "rew_std": 145.3991, "Agent": "DDPG"}, {"env_step": 45000, "rew": -334.0932, "rew_std": 230.6398, "Agent": "DDPG"}, {"env_step": 50000, "rew": -331.5473, "rew_std": 172.596, "Agent": "DDPG"}, {"env_step": 55000, "rew": -318.7348, "rew_std": 146.5198, "Agent": "DDPG"}, {"env_step": 60000, "rew": -439.613, "rew_std": 238.9257, "Agent": "DDPG"}, {"env_step": 65000, "rew": -285.0307, "rew_std": 192.0539, "Agent": "DDPG"}, {"env_step": 70000, "rew": -390.7666, "rew_std": 212.5538, "Agent": "DDPG"}, {"env_step": 75000, "rew": -313.1766, "rew_std": 188.3958, "Agent": "DDPG"}, {"env_step": 80000, "rew": -284.1551, "rew_std": 206.5472, "Agent": "DDPG"}, {"env_step": 85000, "rew": -199.3411, "rew_std": 71.2859, "Agent": "DDPG"}, {"env_step": 90000, "rew": -264.6298, "rew_std": 171.4911, "Agent": "DDPG"}, {"env_step": 95000, "rew": -290.3529, "rew_std": 189.5071, "Agent": "DDPG"}, {"env_step": 100000, "rew": -286.0806, "rew_std": 141.4327, "Agent": "DDPG"}, {"env_step": 105000, "rew": -262.0053, "rew_std": 160.5764, "Agent": "DDPG"}, {"env_step": 110000, "rew": -246.8272, "rew_std": 157.0853, "Agent": "DDPG"}, {"env_step": 115000, "rew": -383.9334, "rew_std": 148.8186, "Agent": "DDPG"}, {"env_step": 120000, "rew": -304.7294, "rew_std": 147.2911, "Agent": "DDPG"}, {"env_step": 125000, "rew": -351.9924, "rew_std": 249.8939, "Agent": "DDPG"}, {"env_step": 130000, "rew": -334.1367, "rew_std": 192.0608, "Agent": "DDPG"}, {"env_step": 135000, "rew": -350.9877, "rew_std": 207.3599, "Agent": "DDPG"}, {"env_step": 140000, "rew": -274.5018, "rew_std": 158.3473, "Agent": "DDPG"}, {"env_step": 145000, "rew": -323.9643, "rew_std": 171.0525, "Agent": "DDPG"}, {"env_step": 150000, "rew": -268.7093, "rew_std": 162.6873, "Agent": "DDPG"}, {"env_step": 155000, "rew": -267.165, "rew_std": 141.0928, "Agent": "DDPG"}, {"env_step": 160000, "rew": -292.6231, "rew_std": 129.7231, "Agent": "DDPG"}, {"env_step": 165000, "rew": -273.1202, "rew_std": 160.0995, "Agent": "DDPG"}, {"env_step": 170000, "rew": -229.7015, "rew_std": 94.2036, "Agent": "DDPG"}, {"env_step": 175000, "rew": -228.0526, "rew_std": 151.2225, "Agent": "DDPG"}, {"env_step": 180000, "rew": -261.7921, "rew_std": 112.1936, "Agent": "DDPG"}, {"env_step": 185000, "rew": -350.9193, "rew_std": 229.0705, "Agent": "DDPG"}, {"env_step": 190000, "rew": -344.8744, "rew_std": 189.5019, "Agent": "DDPG"}, {"env_step": 195000, "rew": -352.284, "rew_std": 245.8252, "Agent": "DDPG"}, {"env_step": 200000, "rew": -184.4852, "rew_std": 96.5308, "Agent": "DDPG"}, {"env_step": 205000, "rew": -272.4764, "rew_std": 120.4672, "Agent": "DDPG"}, {"env_step": 210000, "rew": -287.1041, "rew_std": 137.247, "Agent": "DDPG"}, {"env_step": 215000, "rew": -271.4143, "rew_std": 110.8385, "Agent": "DDPG"}, {"env_step": 220000, "rew": -272.5712, "rew_std": 119.3937, "Agent": "DDPG"}, {"env_step": 225000, "rew": -275.9917, "rew_std": 142.3404, "Agent": "DDPG"}, {"env_step": 230000, "rew": -308.7602, "rew_std": 171.4882, "Agent": "DDPG"}, {"env_step": 235000, "rew": -284.4355, "rew_std": 93.677, "Agent": "DDPG"}, {"env_step": 240000, "rew": -298.3893, "rew_std": 172.9615, "Agent": "DDPG"}, {"env_step": 245000, "rew": -387.3001, "rew_std": 216.0408, "Agent": "DDPG"}, {"env_step": 250000, "rew": -298.1023, "rew_std": 146.4381, "Agent": "DDPG"}, {"env_step": 255000, "rew": -258.6759, "rew_std": 121.7973, "Agent": "DDPG"}, {"env_step": 260000, "rew": -324.8005, "rew_std": 166.7637, "Agent": "DDPG"}, {"env_step": 265000, "rew": -255.6078, "rew_std": 156.5995, "Agent": "DDPG"}, {"env_step": 270000, "rew": -316.6506, "rew_std": 147.5006, "Agent": "DDPG"}, {"env_step": 275000, "rew": -258.3453, "rew_std": 137.476, "Agent": "DDPG"}, {"env_step": 280000, "rew": -390.4388, "rew_std": 235.748, "Agent": "DDPG"}, {"env_step": 285000, "rew": -225.9875, "rew_std": 77.8894, "Agent": "DDPG"}, {"env_step": 290000, "rew": -290.4895, "rew_std": 185.9677, "Agent": "DDPG"}, {"env_step": 295000, "rew": -300.5484, "rew_std": 123.4829, "Agent": "DDPG"}, {"env_step": 300000, "rew": -362.7267, "rew_std": 156.1688, "Agent": "DDPG"}, {"env_step": 305000, "rew": -213.9227, "rew_std": 93.6869, "Agent": "DDPG"}, {"env_step": 310000, "rew": -327.0641, "rew_std": 86.7959, "Agent": "DDPG"}, {"env_step": 315000, "rew": -234.5996, "rew_std": 132.1258, "Agent": "DDPG"}, {"env_step": 320000, "rew": -294.0503, "rew_std": 185.8398, "Agent": "DDPG"}, {"env_step": 325000, "rew": -305.9732, "rew_std": 155.4417, "Agent": "DDPG"}, {"env_step": 330000, "rew": -365.8385, "rew_std": 181.6744, "Agent": "DDPG"}, {"env_step": 335000, "rew": -368.2359, "rew_std": 182.6425, "Agent": "DDPG"}, {"env_step": 340000, "rew": -348.5352, "rew_std": 133.1437, "Agent": "DDPG"}, {"env_step": 345000, "rew": -384.662, "rew_std": 145.002, "Agent": "DDPG"}, {"env_step": 350000, "rew": -331.6225, "rew_std": 131.0167, "Agent": "DDPG"}, {"env_step": 355000, "rew": -259.168, "rew_std": 76.1548, "Agent": "DDPG"}, {"env_step": 360000, "rew": -255.8124, "rew_std": 130.9712, "Agent": "DDPG"}, {"env_step": 365000, "rew": -456.0603, "rew_std": 194.8, "Agent": "DDPG"}, {"env_step": 370000, "rew": -398.9166, "rew_std": 150.5447, "Agent": "DDPG"}, {"env_step": 375000, "rew": -405.75, "rew_std": 363.3503, "Agent": "DDPG"}, {"env_step": 380000, "rew": -662.0463, "rew_std": 177.3496, "Agent": "DDPG"}, {"env_step": 385000, "rew": -538.3942, "rew_std": 419.9355, "Agent": "DDPG"}, {"env_step": 390000, "rew": -645.4876, "rew_std": 362.0333, "Agent": "DDPG"}, {"env_step": 395000, "rew": -722.5296, "rew_std": 343.0093, "Agent": "DDPG"}, {"env_step": 400000, "rew": -785.547, "rew_std": 550.5672, "Agent": "DDPG"}, {"env_step": 405000, "rew": -651.5462, "rew_std": 359.0273, "Agent": "DDPG"}, {"env_step": 410000, "rew": -590.5508, "rew_std": 393.7796, "Agent": "DDPG"}, {"env_step": 415000, "rew": -680.8052, "rew_std": 484.7692, "Agent": "DDPG"}, {"env_step": 420000, "rew": -700.6755, "rew_std": 544.5943, "Agent": "DDPG"}, {"env_step": 425000, "rew": -570.4075, "rew_std": 538.7718, "Agent": "DDPG"}, {"env_step": 430000, "rew": -703.2318, "rew_std": 485.7277, "Agent": "DDPG"}, {"env_step": 435000, "rew": -683.4084, "rew_std": 577.0482, "Agent": "DDPG"}, {"env_step": 440000, "rew": -640.5323, "rew_std": 457.5518, "Agent": "DDPG"}, {"env_step": 445000, "rew": -574.8007, "rew_std": 472.5012, "Agent": "DDPG"}, {"env_step": 450000, "rew": -693.8662, "rew_std": 331.3535, "Agent": "DDPG"}, {"env_step": 455000, "rew": -761.8418, "rew_std": 438.3566, "Agent": "DDPG"}, {"env_step": 460000, "rew": -790.4578, "rew_std": 510.3858, "Agent": "DDPG"}, {"env_step": 465000, "rew": -734.0699, "rew_std": 502.4104, "Agent": "DDPG"}, {"env_step": 470000, "rew": -580.8933, "rew_std": 496.5509, "Agent": "DDPG"}, {"env_step": 475000, "rew": -622.7698, "rew_std": 306.7372, "Agent": "DDPG"}, {"env_step": 480000, "rew": -597.5903, "rew_std": 479.7028, "Agent": "DDPG"}, {"env_step": 485000, "rew": -496.5723, "rew_std": 409.4345, "Agent": "DDPG"}, {"env_step": 490000, "rew": -474.7281, "rew_std": 553.0422, "Agent": "DDPG"}, {"env_step": 495000, "rew": -718.454, "rew_std": 508.5459, "Agent": "DDPG"}, {"env_step": 500000, "rew": -519.0221, "rew_std": 485.7399, "Agent": "DDPG"}, {"env_step": 505000, "rew": -345.1241, "rew_std": 409.183, "Agent": "DDPG"}, {"env_step": 510000, "rew": -517.5172, "rew_std": 304.7734, "Agent": "DDPG"}, {"env_step": 515000, "rew": -387.9395, "rew_std": 315.7722, "Agent": "DDPG"}, {"env_step": 520000, "rew": -457.5481, "rew_std": 390.5131, "Agent": "DDPG"}, {"env_step": 525000, "rew": -391.5585, "rew_std": 539.0123, "Agent": "DDPG"}, {"env_step": 530000, "rew": -360.2725, "rew_std": 414.1826, "Agent": "DDPG"}, {"env_step": 535000, "rew": -320.7459, "rew_std": 465.0856, "Agent": "DDPG"}, {"env_step": 540000, "rew": -368.0916, "rew_std": 350.6185, "Agent": "DDPG"}, {"env_step": 545000, "rew": -520.4293, "rew_std": 342.2237, "Agent": "DDPG"}, {"env_step": 550000, "rew": -468.8602, "rew_std": 440.5926, "Agent": "DDPG"}, {"env_step": 555000, "rew": -378.1778, "rew_std": 502.1599, "Agent": "DDPG"}, {"env_step": 560000, "rew": -408.0724, "rew_std": 358.9013, "Agent": "DDPG"}, {"env_step": 565000, "rew": -473.7454, "rew_std": 498.5437, "Agent": "DDPG"}, {"env_step": 570000, "rew": -337.2682, "rew_std": 552.3182, "Agent": "DDPG"}, {"env_step": 575000, "rew": -318.0568, "rew_std": 663.5847, "Agent": "DDPG"}, {"env_step": 580000, "rew": -467.2081, "rew_std": 686.31, "Agent": "DDPG"}, {"env_step": 585000, "rew": -283.433, "rew_std": 499.1016, "Agent": "DDPG"}, {"env_step": 590000, "rew": -576.0506, "rew_std": 743.3304, "Agent": "DDPG"}, {"env_step": 595000, "rew": -523.4312, "rew_std": 543.8762, "Agent": "DDPG"}, {"env_step": 600000, "rew": -290.2641, "rew_std": 504.4617, "Agent": "DDPG"}, {"env_step": 605000, "rew": -287.9134, "rew_std": 468.2899, "Agent": "DDPG"}, {"env_step": 610000, "rew": -279.245, "rew_std": 510.2628, "Agent": "DDPG"}, {"env_step": 615000, "rew": -293.0744, "rew_std": 521.4399, "Agent": "DDPG"}, {"env_step": 620000, "rew": -262.9651, "rew_std": 532.2983, "Agent": "DDPG"}, {"env_step": 625000, "rew": -114.4813, "rew_std": 423.1847, "Agent": "DDPG"}, {"env_step": 630000, "rew": -252.8271, "rew_std": 655.7101, "Agent": "DDPG"}, {"env_step": 635000, "rew": -231.8681, "rew_std": 583.7409, "Agent": "DDPG"}, {"env_step": 640000, "rew": -225.1097, "rew_std": 576.478, "Agent": "DDPG"}, {"env_step": 645000, "rew": -216.8845, "rew_std": 577.7498, "Agent": "DDPG"}, {"env_step": 650000, "rew": -69.707, "rew_std": 457.7335, "Agent": "DDPG"}, {"env_step": 655000, "rew": 38.7784, "rew_std": 478.9931, "Agent": "DDPG"}, {"env_step": 660000, "rew": -48.134, "rew_std": 403.0322, "Agent": "DDPG"}, {"env_step": 665000, "rew": 74.6522, "rew_std": 390.9822, "Agent": "DDPG"}, {"env_step": 670000, "rew": 20.0033, "rew_std": 536.4488, "Agent": "DDPG"}, {"env_step": 675000, "rew": 153.8525, "rew_std": 426.2199, "Agent": "DDPG"}, {"env_step": 680000, "rew": 150.8311, "rew_std": 489.5175, "Agent": "DDPG"}, {"env_step": 685000, "rew": 37.3832, "rew_std": 762.0161, "Agent": "DDPG"}, {"env_step": 690000, "rew": 226.8652, "rew_std": 427.3436, "Agent": "DDPG"}, {"env_step": 695000, "rew": 244.6373, "rew_std": 437.9303, "Agent": "DDPG"}, {"env_step": 700000, "rew": 91.1048, "rew_std": 759.342, "Agent": "DDPG"}, {"env_step": 705000, "rew": 178.5016, "rew_std": 626.6264, "Agent": "DDPG"}, {"env_step": 710000, "rew": 108.6379, "rew_std": 898.4505, "Agent": "DDPG"}, {"env_step": 715000, "rew": 94.0608, "rew_std": 967.2715, "Agent": "DDPG"}, {"env_step": 720000, "rew": 162.4966, "rew_std": 747.3213, "Agent": "DDPG"}, {"env_step": 725000, "rew": 39.8885, "rew_std": 568.4475, "Agent": "DDPG"}, {"env_step": 730000, "rew": 52.2043, "rew_std": 812.1541, "Agent": "DDPG"}, {"env_step": 735000, "rew": 111.9638, "rew_std": 643.1707, "Agent": "DDPG"}, {"env_step": 740000, "rew": 34.238, "rew_std": 905.4223, "Agent": "DDPG"}, {"env_step": 745000, "rew": 35.7718, "rew_std": 826.4736, "Agent": "DDPG"}, {"env_step": 750000, "rew": 136.6419, "rew_std": 934.359, "Agent": "DDPG"}, {"env_step": 755000, "rew": 52.2149, "rew_std": 838.1785, "Agent": "DDPG"}, {"env_step": 760000, "rew": 104.1105, "rew_std": 826.4385, "Agent": "DDPG"}, {"env_step": 765000, "rew": 89.9899, "rew_std": 751.6642, "Agent": "DDPG"}, {"env_step": 770000, "rew": 182.7996, "rew_std": 809.7852, "Agent": "DDPG"}, {"env_step": 775000, "rew": 137.0194, "rew_std": 735.5012, "Agent": "DDPG"}, {"env_step": 780000, "rew": 183.6331, "rew_std": 557.8404, "Agent": "DDPG"}, {"env_step": 785000, "rew": 120.9358, "rew_std": 731.4159, "Agent": "DDPG"}, {"env_step": 790000, "rew": 149.1463, "rew_std": 582.7867, "Agent": "DDPG"}, {"env_step": 795000, "rew": 153.3002, "rew_std": 767.275, "Agent": "DDPG"}, {"env_step": 800000, "rew": 212.4554, "rew_std": 572.2873, "Agent": "DDPG"}, {"env_step": 805000, "rew": 186.4028, "rew_std": 478.7203, "Agent": "DDPG"}, {"env_step": 810000, "rew": 124.0634, "rew_std": 711.6635, "Agent": "DDPG"}, {"env_step": 815000, "rew": 121.4412, "rew_std": 562.7584, "Agent": "DDPG"}, {"env_step": 820000, "rew": 106.4889, "rew_std": 510.6887, "Agent": "DDPG"}, {"env_step": 825000, "rew": 201.6965, "rew_std": 494.3505, "Agent": "DDPG"}, {"env_step": 830000, "rew": 199.0214, "rew_std": 519.6556, "Agent": "DDPG"}, {"env_step": 835000, "rew": 306.1893, "rew_std": 582.493, "Agent": "DDPG"}, {"env_step": 840000, "rew": 304.76, "rew_std": 371.3446, "Agent": "DDPG"}, {"env_step": 845000, "rew": 194.2056, "rew_std": 570.5582, "Agent": "DDPG"}, {"env_step": 850000, "rew": 317.9959, "rew_std": 457.7196, "Agent": "DDPG"}, {"env_step": 855000, "rew": 313.0282, "rew_std": 375.4861, "Agent": "DDPG"}, {"env_step": 860000, "rew": 306.9646, "rew_std": 413.8683, "Agent": "DDPG"}, {"env_step": 865000, "rew": 383.4445, "rew_std": 301.2858, "Agent": "DDPG"}, {"env_step": 870000, "rew": 279.7083, "rew_std": 284.7498, "Agent": "DDPG"}, {"env_step": 875000, "rew": 358.8884, "rew_std": 412.0223, "Agent": "DDPG"}, {"env_step": 880000, "rew": 535.1728, "rew_std": 383.7316, "Agent": "DDPG"}, {"env_step": 885000, "rew": 346.6428, "rew_std": 225.1636, "Agent": "DDPG"}, {"env_step": 890000, "rew": 339.5073, "rew_std": 350.2322, "Agent": "DDPG"}, {"env_step": 895000, "rew": 331.3404, "rew_std": 685.289, "Agent": "DDPG"}, {"env_step": 900000, "rew": 346.2813, "rew_std": 604.3274, "Agent": "DDPG"}, {"env_step": 905000, "rew": 339.2269, "rew_std": 379.4845, "Agent": "DDPG"}, {"env_step": 910000, "rew": 324.2864, "rew_std": 606.8819, "Agent": "DDPG"}, {"env_step": 915000, "rew": 174.4781, "rew_std": 733.2932, "Agent": "DDPG"}, {"env_step": 920000, "rew": 255.1748, "rew_std": 575.7423, "Agent": "DDPG"}, {"env_step": 925000, "rew": 238.2941, "rew_std": 818.7228, "Agent": "DDPG"}, {"env_step": 930000, "rew": 260.7616, "rew_std": 750.9644, "Agent": "DDPG"}, {"env_step": 935000, "rew": 261.9765, "rew_std": 574.0636, "Agent": "DDPG"}, {"env_step": 940000, "rew": 159.742, "rew_std": 612.7265, "Agent": "DDPG"}, {"env_step": 945000, "rew": 470.1876, "rew_std": 621.5751, "Agent": "DDPG"}, {"env_step": 950000, "rew": 366.5236, "rew_std": 536.5978, "Agent": "DDPG"}, {"env_step": 955000, "rew": 339.7856, "rew_std": 443.0108, "Agent": "DDPG"}, {"env_step": 960000, "rew": 235.8162, "rew_std": 453.9982, "Agent": "DDPG"}, {"env_step": 965000, "rew": 229.7699, "rew_std": 661.4345, "Agent": "DDPG"}, {"env_step": 970000, "rew": 222.74, "rew_std": 424.5786, "Agent": "DDPG"}, {"env_step": 975000, "rew": 439.9229, "rew_std": 459.5935, "Agent": "DDPG"}, {"env_step": 980000, "rew": 437.2693, "rew_std": 377.1376, "Agent": "DDPG"}, {"env_step": 985000, "rew": 291.6736, "rew_std": 313.2381, "Agent": "DDPG"}, {"env_step": 990000, "rew": 469.9611, "rew_std": 448.3772, "Agent": "DDPG"}, {"env_step": 995000, "rew": 456.8604, "rew_std": 588.505, "Agent": "DDPG"}, {"env_step": 1000000, "rew": 385.1584, "rew_std": 334.4049, "Agent": "DDPG"}, {"env_step": 1005000, "rew": 551.8676, "rew_std": 488.84, "Agent": "DDPG"}, {"env_step": 1010000, "rew": 544.2, "rew_std": 328.5778, "Agent": "DDPG"}, {"env_step": 1015000, "rew": 582.8491, "rew_std": 286.5209, "Agent": "DDPG"}, {"env_step": 1020000, "rew": 484.5955, "rew_std": 273.9864, "Agent": "DDPG"}, {"env_step": 1025000, "rew": 563.1035, "rew_std": 287.232, "Agent": "DDPG"}, {"env_step": 1030000, "rew": 612.7206, "rew_std": 125.2816, "Agent": "DDPG"}, {"env_step": 1035000, "rew": 600.1382, "rew_std": 392.7771, "Agent": "DDPG"}, {"env_step": 1040000, "rew": 565.576, "rew_std": 396.5358, "Agent": "DDPG"}, {"env_step": 1045000, "rew": 487.78, "rew_std": 271.7867, "Agent": "DDPG"}, {"env_step": 1050000, "rew": 637.2793, "rew_std": 260.2136, "Agent": "DDPG"}, {"env_step": 1055000, "rew": 509.3906, "rew_std": 297.949, "Agent": "DDPG"}, {"env_step": 1060000, "rew": 583.282, "rew_std": 332.434, "Agent": "DDPG"}, {"env_step": 1065000, "rew": 601.1719, "rew_std": 217.739, "Agent": "DDPG"}, {"env_step": 1070000, "rew": 767.3685, "rew_std": 304.8501, "Agent": "DDPG"}, {"env_step": 1075000, "rew": 597.0315, "rew_std": 194.0678, "Agent": "DDPG"}, {"env_step": 1080000, "rew": 801.3029, "rew_std": 266.5503, "Agent": "DDPG"}, {"env_step": 1085000, "rew": 685.5964, "rew_std": 236.5172, "Agent": "DDPG"}, {"env_step": 1090000, "rew": 809.0626, "rew_std": 234.3018, "Agent": "DDPG"}, {"env_step": 1095000, "rew": 477.0418, "rew_std": 582.6256, "Agent": "DDPG"}, {"env_step": 1100000, "rew": 584.4327, "rew_std": 370.4071, "Agent": "DDPG"}, {"env_step": 1105000, "rew": 640.5093, "rew_std": 312.2578, "Agent": "DDPG"}, {"env_step": 1110000, "rew": 614.8422, "rew_std": 327.2431, "Agent": "DDPG"}, {"env_step": 1115000, "rew": 491.5984, "rew_std": 318.016, "Agent": "DDPG"}, {"env_step": 1120000, "rew": 538.005, "rew_std": 470.0626, "Agent": "DDPG"}, {"env_step": 1125000, "rew": 591.9692, "rew_std": 376.8948, "Agent": "DDPG"}, {"env_step": 1130000, "rew": 583.9439, "rew_std": 401.7359, "Agent": "DDPG"}, {"env_step": 1135000, "rew": 639.0098, "rew_std": 442.6075, "Agent": "DDPG"}, {"env_step": 1140000, "rew": 661.2861, "rew_std": 382.1447, "Agent": "DDPG"}, {"env_step": 1145000, "rew": 704.7731, "rew_std": 475.0417, "Agent": "DDPG"}, {"env_step": 1150000, "rew": 437.8826, "rew_std": 458.8954, "Agent": "DDPG"}, {"env_step": 1155000, "rew": 646.721, "rew_std": 467.7669, "Agent": "DDPG"}, {"env_step": 1160000, "rew": 724.8509, "rew_std": 380.5183, "Agent": "DDPG"}, {"env_step": 1165000, "rew": 694.4904, "rew_std": 368.5073, "Agent": "DDPG"}, {"env_step": 1170000, "rew": 703.0135, "rew_std": 374.4319, "Agent": "DDPG"}, {"env_step": 1175000, "rew": 726.9614, "rew_std": 465.1964, "Agent": "DDPG"}, {"env_step": 1180000, "rew": 730.3367, "rew_std": 284.869, "Agent": "DDPG"}, {"env_step": 1185000, "rew": 588.1819, "rew_std": 720.0913, "Agent": "DDPG"}, {"env_step": 1190000, "rew": 440.9309, "rew_std": 521.7464, "Agent": "DDPG"}, {"env_step": 1195000, "rew": 740.2113, "rew_std": 274.7408, "Agent": "DDPG"}, {"env_step": 1200000, "rew": 763.1286, "rew_std": 323.932, "Agent": "DDPG"}, {"env_step": 1205000, "rew": 632.2507, "rew_std": 406.6145, "Agent": "DDPG"}, {"env_step": 1210000, "rew": 751.4243, "rew_std": 444.0591, "Agent": "DDPG"}, {"env_step": 1215000, "rew": 671.4103, "rew_std": 475.4886, "Agent": "DDPG"}, {"env_step": 1220000, "rew": 818.7525, "rew_std": 396.8029, "Agent": "DDPG"}, {"env_step": 1225000, "rew": 717.9299, "rew_std": 538.4126, "Agent": "DDPG"}, {"env_step": 1230000, "rew": 658.2258, "rew_std": 608.8801, "Agent": "DDPG"}, {"env_step": 1235000, "rew": 585.0669, "rew_std": 530.2994, "Agent": "DDPG"}, {"env_step": 1240000, "rew": 772.0731, "rew_std": 481.3012, "Agent": "DDPG"}, {"env_step": 1245000, "rew": 801.4048, "rew_std": 588.8195, "Agent": "DDPG"}, {"env_step": 1250000, "rew": 615.916, "rew_std": 440.107, "Agent": "DDPG"}, {"env_step": 0, "rew": -46.1947, "rew_std": 25.5804, "Agent": "NPG"}, {"env_step": 30720, "rew": -29.0009, "rew_std": 15.8916, "Agent": "NPG"}, {"env_step": 61440, "rew": -10.4279, "rew_std": 11.0242, "Agent": "NPG"}, {"env_step": 92160, "rew": 11.1187, "rew_std": 9.0737, "Agent": "NPG"}, {"env_step": 122880, "rew": 27.5852, "rew_std": 16.4638, "Agent": "NPG"}, {"env_step": 153600, "rew": 56.7285, "rew_std": 23.8642, "Agent": "NPG"}, {"env_step": 184320, "rew": 81.2319, "rew_std": 29.1525, "Agent": "NPG"}, {"env_step": 215040, "rew": 159.4704, "rew_std": 47.3793, "Agent": "NPG"}, {"env_step": 245760, "rew": 174.9781, "rew_std": 57.693, "Agent": "NPG"}, {"env_step": 276480, "rew": 178.6358, "rew_std": 32.807, "Agent": "NPG"}, {"env_step": 307200, "rew": 218.3212, "rew_std": 41.035, "Agent": "NPG"}, {"env_step": 337920, "rew": 368.663, "rew_std": 80.0623, "Agent": "NPG"}, {"env_step": 368640, "rew": 432.2163, "rew_std": 63.1225, "Agent": "NPG"}, {"env_step": 399360, "rew": 568.0807, "rew_std": 125.517, "Agent": "NPG"}, {"env_step": 430080, "rew": 631.1259, "rew_std": 114.6371, "Agent": "NPG"}, {"env_step": 460800, "rew": 753.5929, "rew_std": 118.5185, "Agent": "NPG"}, {"env_step": 491520, "rew": 864.7371, "rew_std": 183.4071, "Agent": "NPG"}, {"env_step": 522240, "rew": 940.2978, "rew_std": 158.8018, "Agent": "NPG"}, {"env_step": 552960, "rew": 1021.7661, "rew_std": 159.2406, "Agent": "NPG"}, {"env_step": 583680, "rew": 1131.714, "rew_std": 150.4756, "Agent": "NPG"}, {"env_step": 614400, "rew": 1201.5181, "rew_std": 164.258, "Agent": "NPG"}, {"env_step": 645120, "rew": 1343.1191, "rew_std": 184.6686, "Agent": "NPG"}, {"env_step": 675840, "rew": 1318.401, "rew_std": 229.7468, "Agent": "NPG"}, {"env_step": 706560, "rew": 1459.1159, "rew_std": 222.6298, "Agent": "NPG"}, {"env_step": 737280, "rew": 1542.0295, "rew_std": 203.9479, "Agent": "NPG"}, {"env_step": 768000, "rew": 1634.9176, "rew_std": 218.2131, "Agent": "NPG"}, {"env_step": 798720, "rew": 1692.0983, "rew_std": 343.9785, "Agent": "NPG"}, {"env_step": 829440, "rew": 1906.1507, "rew_std": 457.5102, "Agent": "NPG"}, {"env_step": 860160, "rew": 1775.1748, "rew_std": 342.0144, "Agent": "NPG"}, {"env_step": 890880, "rew": 2102.0494, "rew_std": 355.8503, "Agent": "NPG"}, {"env_step": 921600, "rew": 2046.7794, "rew_std": 340.8884, "Agent": "NPG"}, {"env_step": 952320, "rew": 2164.3512, "rew_std": 405.7482, "Agent": "NPG"}, {"env_step": 983040, "rew": 2348.312, "rew_std": 509.9401, "Agent": "NPG"}, {"env_step": 1013760, "rew": 2365.8958, "rew_std": 523.6603, "Agent": "NPG"}, {"env_step": 1044480, "rew": 2324.9164, "rew_std": 528.4526, "Agent": "NPG"}, {"env_step": 1075200, "rew": 2493.722, "rew_std": 583.8895, "Agent": "NPG"}, {"env_step": 1105920, "rew": 2638.7282, "rew_std": 650.3356, "Agent": "NPG"}, {"env_step": 1136640, "rew": 2588.3598, "rew_std": 506.4239, "Agent": "NPG"}, {"env_step": 1167360, "rew": 2657.8218, "rew_std": 542.1361, "Agent": "NPG"}, {"env_step": 1198080, "rew": 2772.0887, "rew_std": 399.8722, "Agent": "NPG"}, {"env_step": 1228800, "rew": 2983.8532, "rew_std": 405.1427, "Agent": "NPG"}, {"env_step": 1259520, "rew": 2969.912, "rew_std": 543.0224, "Agent": "NPG"}, {"env_step": 1290240, "rew": 2898.5856, "rew_std": 687.1927, "Agent": "NPG"}, {"env_step": 1320960, "rew": 2979.687, "rew_std": 685.3181, "Agent": "NPG"}, {"env_step": 1351680, "rew": 2937.7865, "rew_std": 654.2811, "Agent": "NPG"}, {"env_step": 1382400, "rew": 3180.3262, "rew_std": 502.1675, "Agent": "NPG"}, {"env_step": 1413120, "rew": 3181.4746, "rew_std": 526.9918, "Agent": "NPG"}, {"env_step": 1443840, "rew": 3186.725, "rew_std": 483.0104, "Agent": "NPG"}, {"env_step": 1474560, "rew": 3347.1624, "rew_std": 474.3212, "Agent": "NPG"}, {"env_step": 1505280, "rew": 3264.1247, "rew_std": 542.1326, "Agent": "NPG"}, {"env_step": 1536000, "rew": 3267.3737, "rew_std": 536.477, "Agent": "NPG"}, {"env_step": 1566720, "rew": 3677.709, "rew_std": 486.0857, "Agent": "NPG"}, {"env_step": 1597440, "rew": 3379.1083, "rew_std": 683.1763, "Agent": "NPG"}, {"env_step": 1628160, "rew": 3533.6653, "rew_std": 437.9623, "Agent": "NPG"}, {"env_step": 1658880, "rew": 3534.0292, "rew_std": 787.6867, "Agent": "NPG"}, {"env_step": 1689600, "rew": 3399.7589, "rew_std": 685.1419, "Agent": "NPG"}, {"env_step": 1720320, "rew": 3587.7024, "rew_std": 471.134, "Agent": "NPG"}, {"env_step": 1751040, "rew": 3560.6233, "rew_std": 616.8093, "Agent": "NPG"}, {"env_step": 1781760, "rew": 3635.7303, "rew_std": 608.4666, "Agent": "NPG"}, {"env_step": 1812480, "rew": 3713.5899, "rew_std": 802.8577, "Agent": "NPG"}, {"env_step": 1843200, "rew": 3590.908, "rew_std": 557.7779, "Agent": "NPG"}, {"env_step": 1873920, "rew": 3903.7812, "rew_std": 655.7805, "Agent": "NPG"}, {"env_step": 1904640, "rew": 3770.5075, "rew_std": 645.9229, "Agent": "NPG"}, {"env_step": 1935360, "rew": 4110.3599, "rew_std": 657.3085, "Agent": "NPG"}, {"env_step": 1966080, "rew": 3851.8914, "rew_std": 745.2079, "Agent": "NPG"}, {"env_step": 1996800, "rew": 3998.0014, "rew_std": 650.7886, "Agent": "NPG"}, {"env_step": 2027520, "rew": 3739.3657, "rew_std": 715.6727, "Agent": "NPG"}, {"env_step": 2058240, "rew": 4230.5764, "rew_std": 578.5901, "Agent": "NPG"}, {"env_step": 2088960, "rew": 4140.935, "rew_std": 624.3245, "Agent": "NPG"}, {"env_step": 2119680, "rew": 4228.9808, "rew_std": 573.9637, "Agent": "NPG"}, {"env_step": 2150400, "rew": 4142.6649, "rew_std": 419.5781, "Agent": "NPG"}, {"env_step": 2181120, "rew": 4089.8147, "rew_std": 302.9776, "Agent": "NPG"}, {"env_step": 2211840, "rew": 4276.8854, "rew_std": 674.4424, "Agent": "NPG"}, {"env_step": 2242560, "rew": 4312.1654, "rew_std": 567.5481, "Agent": "NPG"}, {"env_step": 2273280, "rew": 4224.3566, "rew_std": 445.0954, "Agent": "NPG"}, {"env_step": 2304000, "rew": 3878.7632, "rew_std": 866.3551, "Agent": "NPG"}, {"env_step": 2334720, "rew": 4001.3801, "rew_std": 478.1705, "Agent": "NPG"}, {"env_step": 2365440, "rew": 4284.5594, "rew_std": 448.8121, "Agent": "NPG"}, {"env_step": 2396160, "rew": 4406.6923, "rew_std": 516.8683, "Agent": "NPG"}, {"env_step": 2426880, "rew": 4145.9032, "rew_std": 519.4268, "Agent": "NPG"}, {"env_step": 2457600, "rew": 4241.7632, "rew_std": 685.6791, "Agent": "NPG"}, {"env_step": 2488320, "rew": 4154.1219, "rew_std": 437.1567, "Agent": "NPG"}, {"env_step": 2519040, "rew": 4495.7374, "rew_std": 449.1806, "Agent": "NPG"}, {"env_step": 2549760, "rew": 4289.7487, "rew_std": 526.7084, "Agent": "NPG"}, {"env_step": 2580480, "rew": 4246.0211, "rew_std": 530.6265, "Agent": "NPG"}, {"env_step": 2611200, "rew": 4463.8985, "rew_std": 572.8797, "Agent": "NPG"}, {"env_step": 2641920, "rew": 4298.6282, "rew_std": 665.9416, "Agent": "NPG"}, {"env_step": 2672640, "rew": 4485.5394, "rew_std": 359.9158, "Agent": "NPG"}, {"env_step": 2703360, "rew": 4820.597, "rew_std": 318.5627, "Agent": "NPG"}, {"env_step": 2734080, "rew": 4540.1727, "rew_std": 412.9545, "Agent": "NPG"}, {"env_step": 2764800, "rew": 4500.1939, "rew_std": 596.1343, "Agent": "NPG"}, {"env_step": 2795520, "rew": 4664.0692, "rew_std": 426.6286, "Agent": "NPG"}, {"env_step": 2826240, "rew": 4516.467, "rew_std": 435.656, "Agent": "NPG"}, {"env_step": 2856960, "rew": 4545.139, "rew_std": 496.411, "Agent": "NPG"}, {"env_step": 2887680, "rew": 4444.0518, "rew_std": 596.6213, "Agent": "NPG"}, {"env_step": 2918400, "rew": 4658.8307, "rew_std": 652.0561, "Agent": "NPG"}, {"env_step": 2949120, "rew": 4509.4439, "rew_std": 466.3483, "Agent": "NPG"}, {"env_step": 2979840, "rew": 4589.8375, "rew_std": 414.0363, "Agent": "NPG"}, {"env_step": 3010560, "rew": 4693.0902, "rew_std": 490.4674, "Agent": "NPG"}, {"env_step": 3041280, "rew": 4678.8152, "rew_std": 313.0054, "Agent": "NPG"}, {"env_step": 3072000, "rew": 4736.6273, "rew_std": 376.7205, "Agent": "NPG"}]