[{"env_step": 0, "rew": 95.0, "rew_std": 75.92759709091287, "Agent": "c51"}, {"env_step": 100000, "rew": 251.5, "rew_std": 82.12186067059123, "Agent": "c51"}, {"env_step": 200000, "rew": 255.5, "rew_std": 117.85478352616833, "Agent": "c51"}, {"env_step": 300000, "rew": 320.0, "rew_std": 42.175229697062704, "Agent": "c51"}, {"env_step": 400000, "rew": 332.5, "rew_std": 83.60621986431393, "Agent": "c51"}, {"env_step": 500000, "rew": 430.25, "rew_std": 135.99839153460601, "Agent": "c51"}, {"env_step": 600000, "rew": 523.75, "rew_std": 108.9681719586045, "Agent": "c51"}, {"env_step": 700000, "rew": 1121.0, "rew_std": 516.2099863427673, "Agent": "c51"}, {"env_step": 800000, "rew": 1754.75, "rew_std": 1004.4398003364861, "Agent": "c51"}, {"env_step": 900000, "rew": 2517.0, "rew_std": 1108.9954914245593, "Agent": "c51"}, {"env_step": 1000000, "rew": 2285.0, "rew_std": 1031.815753901829, "Agent": "c51"}, {"env_step": 1100000, "rew": 2877.75, "rew_std": 1017.4357780715203, "Agent": "c51"}, {"env_step": 1200000, "rew": 3304.5, "rew_std": 804.6146593245738, "Agent": "c51"}, {"env_step": 1300000, "rew": 3511.25, "rew_std": 1172.84443235239, "Agent": "c51"}, {"env_step": 1400000, "rew": 3495.0, "rew_std": 713.4371030441296, "Agent": "c51"}, {"env_step": 1500000, "rew": 3199.0, "rew_std": 1272.923897960911, "Agent": "c51"}, {"env_step": 1600000, "rew": 3992.0, "rew_std": 1011.4944389367645, "Agent": "c51"}, {"env_step": 1700000, "rew": 4453.75, "rew_std": 1278.8536126156114, "Agent": "c51"}, {"env_step": 1800000, "rew": 3931.5, "rew_std": 1001.7822867270114, "Agent": "c51"}, {"env_step": 1900000, "rew": 4928.25, "rew_std": 1331.802842953866, "Agent": "c51"}, {"env_step": 2000000, "rew": 4457.0, "rew_std": 1296.9019816470325, "Agent": "c51"}, {"env_step": 2100000, "rew": 5236.75, "rew_std": 1800.0354336790151, "Agent": "c51"}, {"env_step": 2200000, "rew": 4757.25, "rew_std": 1431.1256277839482, "Agent": "c51"}, {"env_step": 2300000, "rew": 4738.25, "rew_std": 1369.4538373015719, "Agent": "c51"}, {"env_step": 2400000, "rew": 6592.0, "rew_std": 1420.6903251588644, "Agent": "c51"}, {"env_step": 2500000, "rew": 5894.25, "rew_std": 1735.2507203571477, "Agent": "c51"}, {"env_step": 2600000, "rew": 7282.25, "rew_std": 2613.5424833929906, "Agent": "c51"}, {"env_step": 2700000, "rew": 7078.25, "rew_std": 2062.308188050467, "Agent": "c51"}, {"env_step": 2800000, "rew": 6066.25, "rew_std": 1512.1017037554054, "Agent": "c51"}, {"env_step": 2900000, "rew": 7065.5, "rew_std": 2015.3544353289324, "Agent": "c51"}, {"env_step": 3000000, "rew": 6861.0, "rew_std": 1669.891538394036, "Agent": "c51"}, {"env_step": 3100000, "rew": 7762.75, "rew_std": 2067.515553145852, "Agent": "c51"}, {"env_step": 3200000, "rew": 7553.5, "rew_std": 2434.32644688423, "Agent": "c51"}, {"env_step": 3300000, "rew": 6468.25, "rew_std": 1466.2916873869265, "Agent": "c51"}, {"env_step": 3400000, "rew": 7396.25, "rew_std": 2111.3411762431956, "Agent": "c51"}, {"env_step": 3500000, "rew": 7398.75, "rew_std": 2466.653413534216, "Agent": "c51"}, {"env_step": 3600000, "rew": 7548.75, "rew_std": 2775.422546658436, "Agent": "c51"}, {"env_step": 3700000, "rew": 8335.5, "rew_std": 2109.992239322221, "Agent": "c51"}, {"env_step": 3800000, "rew": 6925.0, "rew_std": 1951.7191140120547, "Agent": "c51"}, {"env_step": 3900000, "rew": 7580.5, "rew_std": 2267.1120947143304, "Agent": "c51"}, {"env_step": 4000000, "rew": 8586.75, "rew_std": 2490.3042108344916, "Agent": "c51"}, {"env_step": 4100000, "rew": 8712.75, "rew_std": 2641.0264221510547, "Agent": "c51"}, {"env_step": 4200000, "rew": 9052.75, "rew_std": 1451.2083112013934, "Agent": "c51"}, {"env_step": 4300000, "rew": 7919.75, "rew_std": 1486.0133116833106, "Agent": "c51"}, {"env_step": 4400000, "rew": 9568.25, "rew_std": 2890.1516071825713, "Agent": "c51"}, {"env_step": 4500000, "rew": 8489.0, "rew_std": 1878.7070687044322, "Agent": "c51"}, {"env_step": 4600000, "rew": 8453.75, "rew_std": 2539.73577611924, "Agent": "c51"}, {"env_step": 4700000, "rew": 8407.0, "rew_std": 2617.2267765709566, "Agent": "c51"}, {"env_step": 4800000, "rew": 8893.25, "rew_std": 2978.127568204559, "Agent": "c51"}, {"env_step": 4900000, "rew": 10263.75, "rew_std": 2290.572322040935, "Agent": "c51"}, {"env_step": 5000000, "rew": 8514.5, "rew_std": 1787.0897431298743, "Agent": "c51"}, {"env_step": 5100000, "rew": 8638.75, "rew_std": 2969.4349736102995, "Agent": "c51"}, {"env_step": 5200000, "rew": 10585.75, "rew_std": 3481.069708078251, "Agent": "c51"}, {"env_step": 5300000, "rew": 9607.5, "rew_std": 2606.770032051159, "Agent": "c51"}, {"env_step": 5400000, "rew": 9306.5, "rew_std": 2684.2033734424817, "Agent": "c51"}, {"env_step": 5500000, "rew": 9660.75, "rew_std": 2237.9474552589477, "Agent": "c51"}, {"env_step": 5600000, "rew": 9766.25, "rew_std": 2911.0542012302003, "Agent": "c51"}, {"env_step": 5700000, "rew": 10415.5, "rew_std": 1625.4448621838885, "Agent": "c51"}, {"env_step": 5800000, "rew": 9485.5, "rew_std": 3670.640407340387, "Agent": "c51"}, {"env_step": 5900000, "rew": 10269.0, "rew_std": 2380.1436931412354, "Agent": "c51"}, {"env_step": 6000000, "rew": 10933.5, "rew_std": 2768.2542332668795, "Agent": "c51"}, {"env_step": 6100000, "rew": 10309.25, "rew_std": 2190.8112224698866, "Agent": "c51"}, {"env_step": 6200000, "rew": 10257.0, "rew_std": 3413.4135773445328, "Agent": "c51"}, {"env_step": 6300000, "rew": 9958.0, "rew_std": 2849.388925717232, "Agent": "c51"}, {"env_step": 6400000, "rew": 11790.0, "rew_std": 1323.6403401226482, "Agent": "c51"}, {"env_step": 6500000, "rew": 10310.75, "rew_std": 2311.68581613073, "Agent": "c51"}, {"env_step": 6600000, "rew": 9120.75, "rew_std": 2925.0596254606503, "Agent": "c51"}, {"env_step": 6700000, "rew": 10305.5, "rew_std": 2839.6374768621436, "Agent": "c51"}, {"env_step": 6800000, "rew": 10348.75, "rew_std": 3006.7963121069574, "Agent": "c51"}, {"env_step": 6900000, "rew": 10654.25, "rew_std": 1407.1265268269233, "Agent": "c51"}, {"env_step": 7000000, "rew": 11493.75, "rew_std": 1194.8479244238574, "Agent": "c51"}, {"env_step": 7100000, "rew": 11250.5, "rew_std": 1915.5099843122719, "Agent": "c51"}, {"env_step": 7200000, "rew": 10615.75, "rew_std": 2852.864141963301, "Agent": "c51"}, {"env_step": 7300000, "rew": 10428.75, "rew_std": 1486.1473892249046, "Agent": "c51"}, {"env_step": 7400000, "rew": 11293.0, "rew_std": 2100.1969550496924, "Agent": "c51"}, {"env_step": 7500000, "rew": 10405.0, "rew_std": 2845.91066268778, "Agent": "c51"}, {"env_step": 7600000, "rew": 11912.75, "rew_std": 1889.1385106709354, "Agent": "c51"}, {"env_step": 7700000, "rew": 10792.75, "rew_std": 2319.9715650197095, "Agent": "c51"}, {"env_step": 7800000, "rew": 11481.75, "rew_std": 2059.718442530435, "Agent": "c51"}, {"env_step": 7900000, "rew": 11188.0, "rew_std": 1572.3460973971348, "Agent": "c51"}, {"env_step": 8000000, "rew": 11333.25, "rew_std": 2443.5376634093445, "Agent": "c51"}, {"env_step": 8100000, "rew": 11388.75, "rew_std": 1806.7637677626813, "Agent": "c51"}, {"env_step": 8200000, "rew": 11084.25, "rew_std": 2011.5637729139983, "Agent": "c51"}, {"env_step": 8300000, "rew": 11189.25, "rew_std": 1837.155767075835, "Agent": "c51"}, {"env_step": 8400000, "rew": 12201.5, "rew_std": 1443.038547648676, "Agent": "c51"}, {"env_step": 8500000, "rew": 12172.0, "rew_std": 2153.40886735427, "Agent": "c51"}, {"env_step": 8600000, "rew": 10667.0, "rew_std": 2920.304093754621, "Agent": "c51"}, {"env_step": 8700000, "rew": 12087.25, "rew_std": 1455.5503469478479, "Agent": "c51"}, {"env_step": 8800000, "rew": 11311.0, "rew_std": 2612.836868233453, "Agent": "c51"}, {"env_step": 8900000, "rew": 12494.75, "rew_std": 2119.100767424711, "Agent": "c51"}, {"env_step": 9000000, "rew": 12513.25, "rew_std": 1274.6416408151745, "Agent": "c51"}, {"env_step": 9100000, "rew": 12241.0, "rew_std": 1972.8945106112492, "Agent": "c51"}, {"env_step": 9200000, "rew": 10962.25, "rew_std": 1657.8398784261403, "Agent": "c51"}, {"env_step": 9300000, "rew": 11570.25, "rew_std": 2591.904813549294, "Agent": "c51"}, {"env_step": 9400000, "rew": 11239.25, "rew_std": 2040.6086867648094, "Agent": "c51"}, {"env_step": 9500000, "rew": 11834.25, "rew_std": 1834.925083620582, "Agent": "c51"}, {"env_step": 9600000, "rew": 11510.5, "rew_std": 1754.8346788230508, "Agent": "c51"}, {"env_step": 9700000, "rew": 10276.75, "rew_std": 2304.5601668214263, "Agent": "c51"}, {"env_step": 9800000, "rew": 12446.75, "rew_std": 1572.9002074194027, "Agent": "c51"}, {"env_step": 9900000, "rew": 10765.0, "rew_std": 2277.32930205537, "Agent": "c51"}, {"env_step": 10000000, "rew": 11854.5, "rew_std": 2126.8074078298673, "Agent": "c51"}, {"env_step": 0, "rew": 79.5, "rew_std": 76.44278906476399, "Agent": "dqn"}, {"env_step": 100000, "rew": 306.5, "rew_std": 140.31749712705113, "Agent": "dqn"}, {"env_step": 200000, "rew": 409.5, "rew_std": 96.2925230742242, "Agent": "dqn"}, {"env_step": 300000, "rew": 537.25, "rew_std": 147.0180686174322, "Agent": "dqn"}, {"env_step": 400000, "rew": 534.25, "rew_std": 124.05165254844451, "Agent": "dqn"}, {"env_step": 500000, "rew": 725.25, "rew_std": 251.90883767744236, "Agent": "dqn"}, {"env_step": 600000, "rew": 669.5, "rew_std": 160.39326669159152, "Agent": "dqn"}, {"env_step": 700000, "rew": 958.5, "rew_std": 439.7985334218385, "Agent": "dqn"}, {"env_step": 800000, "rew": 818.5, "rew_std": 111.63668751803773, "Agent": "dqn"}, {"env_step": 900000, "rew": 778.75, "rew_std": 199.5408792703891, "Agent": "dqn"}, {"env_step": 1000000, "rew": 850.0, "rew_std": 283.47618947629445, "Agent": "dqn"}, {"env_step": 1100000, "rew": 1346.0, "rew_std": 645.7797612189469, "Agent": "dqn"}, {"env_step": 1200000, "rew": 1157.5, "rew_std": 768.8619837135922, "Agent": "dqn"}, {"env_step": 1300000, "rew": 1414.5, "rew_std": 999.8636156996613, "Agent": "dqn"}, {"env_step": 1400000, "rew": 1861.25, "rew_std": 1166.1422779832656, "Agent": "dqn"}, {"env_step": 1500000, "rew": 2099.75, "rew_std": 986.7018609995625, "Agent": "dqn"}, {"env_step": 1600000, "rew": 2019.0, "rew_std": 728.7679671884598, "Agent": "dqn"}, {"env_step": 1700000, "rew": 3189.0, "rew_std": 1119.5803901462368, "Agent": "dqn"}, {"env_step": 1800000, "rew": 3215.5, "rew_std": 1019.3391241387726, "Agent": "dqn"}, {"env_step": 1900000, "rew": 4062.5, "rew_std": 644.8352502771542, "Agent": "dqn"}, {"env_step": 2000000, "rew": 3697.75, "rew_std": 775.0285881823974, "Agent": "dqn"}, {"env_step": 2100000, "rew": 4084.75, "rew_std": 369.5460898183067, "Agent": "dqn"}, {"env_step": 2200000, "rew": 4364.5, "rew_std": 82.35441700358275, "Agent": "dqn"}, {"env_step": 2300000, "rew": 3960.5, "rew_std": 493.58357954859076, "Agent": "dqn"}, {"env_step": 2400000, "rew": 4298.5, "rew_std": 337.0908631215032, "Agent": "dqn"}, {"env_step": 2500000, "rew": 3868.5, "rew_std": 810.0564795123856, "Agent": "dqn"}, {"env_step": 2600000, "rew": 3593.0, "rew_std": 1069.2274079913964, "Agent": "dqn"}, {"env_step": 2700000, "rew": 3861.5, "rew_std": 863.5603626846244, "Agent": "dqn"}, {"env_step": 2800000, "rew": 4479.75, "rew_std": 226.15108334916283, "Agent": "dqn"}, {"env_step": 2900000, "rew": 4399.25, "rew_std": 278.67106505699513, "Agent": "dqn"}, {"env_step": 3000000, "rew": 4731.0, "rew_std": 975.6428649869787, "Agent": "dqn"}, {"env_step": 3100000, "rew": 4451.0, "rew_std": 1066.7041529871344, "Agent": "dqn"}, {"env_step": 3200000, "rew": 4260.0, "rew_std": 1112.3870729202133, "Agent": "dqn"}, {"env_step": 3300000, "rew": 4400.75, "rew_std": 758.1804287239285, "Agent": "dqn"}, {"env_step": 3400000, "rew": 4580.5, "rew_std": 901.3668786903588, "Agent": "dqn"}, {"env_step": 3500000, "rew": 4537.0, "rew_std": 1127.5176273566635, "Agent": "dqn"}, {"env_step": 3600000, "rew": 5060.75, "rew_std": 1816.7983686969778, "Agent": "dqn"}, {"env_step": 3700000, "rew": 5504.0, "rew_std": 1962.111808740776, "Agent": "dqn"}, {"env_step": 3800000, "rew": 5938.25, "rew_std": 1861.7293875587827, "Agent": "dqn"}, {"env_step": 3900000, "rew": 5781.75, "rew_std": 1370.2176150159507, "Agent": "dqn"}, {"env_step": 4000000, "rew": 5990.25, "rew_std": 3394.9163189245182, "Agent": "dqn"}, {"env_step": 4100000, "rew": 6092.75, "rew_std": 2065.6846473990167, "Agent": "dqn"}, {"env_step": 4200000, "rew": 6176.0, "rew_std": 1842.3508080710362, "Agent": "dqn"}, {"env_step": 4300000, "rew": 6576.5, "rew_std": 2726.7487966440913, "Agent": "dqn"}, {"env_step": 4400000, "rew": 6971.25, "rew_std": 3082.8676281183402, "Agent": "dqn"}, {"env_step": 4500000, "rew": 6908.25, "rew_std": 2762.2427595162594, "Agent": "dqn"}, {"env_step": 4600000, "rew": 7546.0, "rew_std": 2864.2300885229174, "Agent": "dqn"}, {"env_step": 4700000, "rew": 7737.75, "rew_std": 3928.65680767613, "Agent": "dqn"}, {"env_step": 4800000, "rew": 8261.75, "rew_std": 3556.5873829416873, "Agent": "dqn"}, {"env_step": 4900000, "rew": 8120.5, "rew_std": 2792.5308413695275, "Agent": "dqn"}, {"env_step": 5000000, "rew": 7459.25, "rew_std": 3016.322481516192, "Agent": "dqn"}, {"env_step": 5100000, "rew": 8186.25, "rew_std": 3262.4464076058016, "Agent": "dqn"}, {"env_step": 5200000, "rew": 8457.75, "rew_std": 3065.806062441002, "Agent": "dqn"}, {"env_step": 5300000, "rew": 7461.25, "rew_std": 2633.543062586978, "Agent": "dqn"}, {"env_step": 5400000, "rew": 8212.25, "rew_std": 2857.8948655435174, "Agent": "dqn"}, {"env_step": 5500000, "rew": 8331.0, "rew_std": 2962.497088606164, "Agent": "dqn"}, {"env_step": 5600000, "rew": 8116.0, "rew_std": 3106.8304186099376, "Agent": "dqn"}, {"env_step": 5700000, "rew": 8354.0, "rew_std": 2939.679446810485, "Agent": "dqn"}, {"env_step": 5800000, "rew": 8698.25, "rew_std": 2624.4728161099324, "Agent": "dqn"}, {"env_step": 5900000, "rew": 9697.25, "rew_std": 2572.896337301602, "Agent": "dqn"}, {"env_step": 6000000, "rew": 8455.0, "rew_std": 1774.5978417658464, "Agent": "dqn"}, {"env_step": 6100000, "rew": 9885.75, "rew_std": 3028.3760190075473, "Agent": "dqn"}, {"env_step": 6200000, "rew": 8983.5, "rew_std": 2107.2515274641514, "Agent": "dqn"}, {"env_step": 6300000, "rew": 9419.75, "rew_std": 2727.142838668338, "Agent": "dqn"}, {"env_step": 6400000, "rew": 8409.25, "rew_std": 3007.3811385489535, "Agent": "dqn"}, {"env_step": 6500000, "rew": 9823.75, "rew_std": 2742.98269453163, "Agent": "dqn"}, {"env_step": 6600000, "rew": 9702.25, "rew_std": 2529.285336315379, "Agent": "dqn"}, {"env_step": 6700000, "rew": 10412.5, "rew_std": 2968.082925054487, "Agent": "dqn"}, {"env_step": 6800000, "rew": 9085.25, "rew_std": 2521.6067422379724, "Agent": "dqn"}, {"env_step": 6900000, "rew": 9624.25, "rew_std": 2870.277654252285, "Agent": "dqn"}, {"env_step": 7000000, "rew": 10178.25, "rew_std": 2328.1741907554942, "Agent": "dqn"}, {"env_step": 7100000, "rew": 9411.75, "rew_std": 3466.6296762850225, "Agent": "dqn"}, {"env_step": 7200000, "rew": 10059.0, "rew_std": 2418.3835510522313, "Agent": "dqn"}, {"env_step": 7300000, "rew": 9972.25, "rew_std": 3165.8356815381308, "Agent": "dqn"}, {"env_step": 7400000, "rew": 9769.25, "rew_std": 3534.1402861940837, "Agent": "dqn"}, {"env_step": 7500000, "rew": 9630.75, "rew_std": 3561.6785105480812, "Agent": "dqn"}, {"env_step": 7600000, "rew": 10130.5, "rew_std": 2504.094846446516, "Agent": "dqn"}, {"env_step": 7700000, "rew": 9689.75, "rew_std": 2412.3324941848296, "Agent": "dqn"}, {"env_step": 7800000, "rew": 9682.5, "rew_std": 2696.419848614084, "Agent": "dqn"}, {"env_step": 7900000, "rew": 8600.25, "rew_std": 4069.30498519096, "Agent": "dqn"}, {"env_step": 8000000, "rew": 10808.25, "rew_std": 1838.3657994262187, "Agent": "dqn"}, {"env_step": 8100000, "rew": 10105.5, "rew_std": 3078.21819402069, "Agent": "dqn"}, {"env_step": 8200000, "rew": 9794.25, "rew_std": 3020.5171432223324, "Agent": "dqn"}, {"env_step": 8300000, "rew": 10248.5, "rew_std": 2272.298450908243, "Agent": "dqn"}, {"env_step": 8400000, "rew": 9916.5, "rew_std": 3159.7433044473723, "Agent": "dqn"}, {"env_step": 8500000, "rew": 10325.5, "rew_std": 2780.830316650047, "Agent": "dqn"}, {"env_step": 8600000, "rew": 10778.0, "rew_std": 1940.7523669958514, "Agent": "dqn"}, {"env_step": 8700000, "rew": 10993.0, "rew_std": 2580.0946688057784, "Agent": "dqn"}, {"env_step": 8800000, "rew": 10329.75, "rew_std": 2510.3706026202585, "Agent": "dqn"}, {"env_step": 8900000, "rew": 9983.0, "rew_std": 3615.9431342320636, "Agent": "dqn"}, {"env_step": 9000000, "rew": 11148.0, "rew_std": 1932.5183698997535, "Agent": "dqn"}, {"env_step": 9100000, "rew": 10034.75, "rew_std": 2345.046494741629, "Agent": "dqn"}, {"env_step": 9200000, "rew": 10810.75, "rew_std": 2402.0418527785896, "Agent": "dqn"}, {"env_step": 9300000, "rew": 10502.5, "rew_std": 2058.038811587381, "Agent": "dqn"}, {"env_step": 9400000, "rew": 10956.0, "rew_std": 1991.7147762669233, "Agent": "dqn"}, {"env_step": 9500000, "rew": 11620.25, "rew_std": 786.060947064539, "Agent": "dqn"}, {"env_step": 9600000, "rew": 10733.5, "rew_std": 2011.6753589980665, "Agent": "dqn"}, {"env_step": 9700000, "rew": 11486.25, "rew_std": 2341.8905957580514, "Agent": "dqn"}, {"env_step": 9800000, "rew": 11012.5, "rew_std": 2049.413025722243, "Agent": "dqn"}, {"env_step": 9900000, "rew": 10990.5, "rew_std": 1687.970601047305, "Agent": "dqn"}, {"env_step": 10000000, "rew": 11396.5, "rew_std": 1123.2326117060527, "Agent": "dqn"}, {"env_step": 0, "rew": 62.25, "rew_std": 64.61859252568102, "Agent": "fqf"}, {"env_step": 100000, "rew": 282.5, "rew_std": 133.41195598596101, "Agent": "fqf"}, {"env_step": 200000, "rew": 334.25, "rew_std": 97.66684442532174, "Agent": "fqf"}, {"env_step": 300000, "rew": 478.0, "rew_std": 103.5, "Agent": "fqf"}, {"env_step": 400000, "rew": 497.75, "rew_std": 127.49730389306278, "Agent": "fqf"}, {"env_step": 500000, "rew": 761.75, "rew_std": 323.0790344482291, "Agent": "fqf"}, {"env_step": 600000, "rew": 723.25, "rew_std": 85.77623505377233, "Agent": "fqf"}, {"env_step": 700000, "rew": 1184.75, "rew_std": 753.0441969101149, "Agent": "fqf"}, {"env_step": 800000, "rew": 1227.25, "rew_std": 684.0965301037567, "Agent": "fqf"}, {"env_step": 900000, "rew": 1899.75, "rew_std": 957.4160864013096, "Agent": "fqf"}, {"env_step": 1000000, "rew": 1912.5, "rew_std": 1270.665180132044, "Agent": "fqf"}, {"env_step": 1100000, "rew": 2567.5, "rew_std": 1188.7546004117082, "Agent": "fqf"}, {"env_step": 1200000, "rew": 3371.0, "rew_std": 1017.2175283586103, "Agent": "fqf"}, {"env_step": 1300000, "rew": 3156.25, "rew_std": 890.8782534667686, "Agent": "fqf"}, {"env_step": 1400000, "rew": 3885.0, "rew_std": 888.4551198569346, "Agent": "fqf"}, {"env_step": 1500000, "rew": 3952.75, "rew_std": 590.0110698114062, "Agent": "fqf"}, {"env_step": 1600000, "rew": 3700.0, "rew_std": 1213.4516883667022, "Agent": "fqf"}, {"env_step": 1700000, "rew": 4309.75, "rew_std": 1129.6019486969735, "Agent": "fqf"}, {"env_step": 1800000, "rew": 4612.75, "rew_std": 1088.452714866383, "Agent": "fqf"}, {"env_step": 1900000, "rew": 5602.25, "rew_std": 1122.1271374046703, "Agent": "fqf"}, {"env_step": 2000000, "rew": 6148.5, "rew_std": 2185.0435350354005, "Agent": "fqf"}, {"env_step": 2100000, "rew": 6673.75, "rew_std": 1807.6529153850304, "Agent": "fqf"}, {"env_step": 2200000, "rew": 6371.75, "rew_std": 2170.01153510759, "Agent": "fqf"}, {"env_step": 2300000, "rew": 6601.0, "rew_std": 2183.5877014674725, "Agent": "fqf"}, {"env_step": 2400000, "rew": 7732.0, "rew_std": 1939.5839760113508, "Agent": "fqf"}, {"env_step": 2500000, "rew": 8078.25, "rew_std": 2086.995762453772, "Agent": "fqf"}, {"env_step": 2600000, "rew": 9642.5, "rew_std": 2714.1858816227013, "Agent": "fqf"}, {"env_step": 2700000, "rew": 10048.5, "rew_std": 2313.9531110201865, "Agent": "fqf"}, {"env_step": 2800000, "rew": 9025.75, "rew_std": 3670.8754150066165, "Agent": "fqf"}, {"env_step": 2900000, "rew": 9993.5, "rew_std": 3190.4126300527337, "Agent": "fqf"}, {"env_step": 3000000, "rew": 10725.75, "rew_std": 1486.178846067996, "Agent": "fqf"}, {"env_step": 3100000, "rew": 12443.0, "rew_std": 1860.8062096843937, "Agent": "fqf"}, {"env_step": 3200000, "rew": 11651.5, "rew_std": 1916.6462245286687, "Agent": "fqf"}, {"env_step": 3300000, "rew": 11780.25, "rew_std": 2378.499645259591, "Agent": "fqf"}, {"env_step": 3400000, "rew": 12591.25, "rew_std": 1730.6852869600527, "Agent": "fqf"}, {"env_step": 3500000, "rew": 13177.25, "rew_std": 1040.0303180676995, "Agent": "fqf"}, {"env_step": 3600000, "rew": 12289.75, "rew_std": 3415.4978498748906, "Agent": "fqf"}, {"env_step": 3700000, "rew": 12660.0, "rew_std": 1981.2193215290426, "Agent": "fqf"}, {"env_step": 3800000, "rew": 12749.0, "rew_std": 2114.099453668157, "Agent": "fqf"}, {"env_step": 3900000, "rew": 13807.25, "rew_std": 1109.9293051811903, "Agent": "fqf"}, {"env_step": 4000000, "rew": 14015.25, "rew_std": 1171.8481396921702, "Agent": "fqf"}, {"env_step": 4100000, "rew": 13752.25, "rew_std": 1630.1025466209173, "Agent": "fqf"}, {"env_step": 4200000, "rew": 14020.5, "rew_std": 1309.8782386160938, "Agent": "fqf"}, {"env_step": 4300000, "rew": 13418.75, "rew_std": 1649.8266007371806, "Agent": "fqf"}, {"env_step": 4400000, "rew": 14221.5, "rew_std": 1284.3087634988715, "Agent": "fqf"}, {"env_step": 4500000, "rew": 14305.75, "rew_std": 859.7587234218679, "Agent": "fqf"}, {"env_step": 4600000, "rew": 14158.0, "rew_std": 1344.8414404679831, "Agent": "fqf"}, {"env_step": 4700000, "rew": 12771.5, "rew_std": 1663.6489263062685, "Agent": "fqf"}, {"env_step": 4800000, "rew": 14314.0, "rew_std": 1097.285970018755, "Agent": "fqf"}, {"env_step": 4900000, "rew": 14935.25, "rew_std": 337.25074128902963, "Agent": "fqf"}, {"env_step": 5000000, "rew": 14672.0, "rew_std": 807.711117912834, "Agent": "fqf"}, {"env_step": 5100000, "rew": 14673.0, "rew_std": 571.9405563517943, "Agent": "fqf"}, {"env_step": 5200000, "rew": 14309.75, "rew_std": 1108.4434187183394, "Agent": "fqf"}, {"env_step": 5300000, "rew": 14757.25, "rew_std": 947.0417427442151, "Agent": "fqf"}, {"env_step": 5400000, "rew": 14685.0, "rew_std": 655.1602857316674, "Agent": "fqf"}, {"env_step": 5500000, "rew": 14524.25, "rew_std": 979.248468214273, "Agent": "fqf"}, {"env_step": 5600000, "rew": 14862.5, "rew_std": 499.7686964986903, "Agent": "fqf"}, {"env_step": 5700000, "rew": 14338.0, "rew_std": 1270.7752555035056, "Agent": "fqf"}, {"env_step": 5800000, "rew": 14777.75, "rew_std": 538.4253081904676, "Agent": "fqf"}, {"env_step": 5900000, "rew": 14932.0, "rew_std": 720.0848908288522, "Agent": "fqf"}, {"env_step": 6000000, "rew": 15026.25, "rew_std": 556.9619039934419, "Agent": "fqf"}, {"env_step": 6100000, "rew": 15113.75, "rew_std": 255.20151351432068, "Agent": "fqf"}, {"env_step": 6200000, "rew": 14408.5, "rew_std": 1393.7912325739462, "Agent": "fqf"}, {"env_step": 6300000, "rew": 15156.5, "rew_std": 590.047879413188, "Agent": "fqf"}, {"env_step": 6400000, "rew": 14545.5, "rew_std": 1392.182100157878, "Agent": "fqf"}, {"env_step": 6500000, "rew": 14554.75, "rew_std": 1060.3109508535692, "Agent": "fqf"}, {"env_step": 6600000, "rew": 13926.25, "rew_std": 1543.7536437203962, "Agent": "fqf"}, {"env_step": 6700000, "rew": 14911.25, "rew_std": 508.5976430342555, "Agent": "fqf"}, {"env_step": 6800000, "rew": 14964.0, "rew_std": 1249.9880999433556, "Agent": "fqf"}, {"env_step": 6900000, "rew": 15271.75, "rew_std": 499.26827708157066, "Agent": "fqf"}, {"env_step": 7000000, "rew": 14915.25, "rew_std": 710.6022533738548, "Agent": "fqf"}, {"env_step": 7100000, "rew": 14988.5, "rew_std": 568.0396112948463, "Agent": "fqf"}, {"env_step": 7200000, "rew": 14881.25, "rew_std": 963.4282861220133, "Agent": "fqf"}, {"env_step": 7300000, "rew": 15227.75, "rew_std": 746.1756244343553, "Agent": "fqf"}, {"env_step": 7400000, "rew": 15052.0, "rew_std": 1012.3807337163228, "Agent": "fqf"}, {"env_step": 7500000, "rew": 15262.75, "rew_std": 626.2052878250071, "Agent": "fqf"}, {"env_step": 7600000, "rew": 14771.75, "rew_std": 516.1831675868557, "Agent": "fqf"}, {"env_step": 7700000, "rew": 14902.25, "rew_std": 1191.0822022429854, "Agent": "fqf"}, {"env_step": 7800000, "rew": 15195.0, "rew_std": 983.0596370515881, "Agent": "fqf"}, {"env_step": 7900000, "rew": 15172.75, "rew_std": 897.3812247311619, "Agent": "fqf"}, {"env_step": 8000000, "rew": 14729.5, "rew_std": 1125.9345007592583, "Agent": "fqf"}, {"env_step": 8100000, "rew": 14950.75, "rew_std": 407.5706227146407, "Agent": "fqf"}, {"env_step": 8200000, "rew": 14679.25, "rew_std": 1469.804004791115, "Agent": "fqf"}, {"env_step": 8300000, "rew": 14879.75, "rew_std": 1249.1259193932372, "Agent": "fqf"}, {"env_step": 8400000, "rew": 14759.25, "rew_std": 824.2845761628687, "Agent": "fqf"}, {"env_step": 8500000, "rew": 14181.25, "rew_std": 1934.2803086678, "Agent": "fqf"}, {"env_step": 8600000, "rew": 15150.75, "rew_std": 606.5559022052296, "Agent": "fqf"}, {"env_step": 8700000, "rew": 15301.25, "rew_std": 684.131977399098, "Agent": "fqf"}, {"env_step": 8800000, "rew": 15258.75, "rew_std": 178.02826320559328, "Agent": "fqf"}, {"env_step": 8900000, "rew": 14306.75, "rew_std": 2652.5966169962594, "Agent": "fqf"}, {"env_step": 9000000, "rew": 14469.5, "rew_std": 1781.5501676910476, "Agent": "fqf"}, {"env_step": 9100000, "rew": 14648.25, "rew_std": 983.8413553515628, "Agent": "fqf"}, {"env_step": 9200000, "rew": 15119.25, "rew_std": 669.5624037384417, "Agent": "fqf"}, {"env_step": 9300000, "rew": 14687.75, "rew_std": 914.5568940749395, "Agent": "fqf"}, {"env_step": 9400000, "rew": 14220.0, "rew_std": 3311.433790671346, "Agent": "fqf"}, {"env_step": 9500000, "rew": 15234.75, "rew_std": 382.4288332487497, "Agent": "fqf"}, {"env_step": 9600000, "rew": 14718.75, "rew_std": 632.6375838503432, "Agent": "fqf"}, {"env_step": 9700000, "rew": 14343.5, "rew_std": 1404.7336046382602, "Agent": "fqf"}, {"env_step": 9800000, "rew": 15267.5, "rew_std": 387.3209263646879, "Agent": "fqf"}, {"env_step": 9900000, "rew": 15137.75, "rew_std": 331.75, "Agent": "fqf"}, {"env_step": 10000000, "rew": 14602.75, "rew_std": 1270.1847552620052, "Agent": "fqf"}, {"env_step": 0, "rew": 63.5, "rew_std": 62.13091018164791, "Agent": "qrdqn"}, {"env_step": 100000, "rew": 270.75, "rew_std": 151.2119786921658, "Agent": "qrdqn"}, {"env_step": 200000, "rew": 330.0, "rew_std": 140.30324301312496, "Agent": "qrdqn"}, {"env_step": 300000, "rew": 482.5, "rew_std": 145.48625364617786, "Agent": "qrdqn"}, {"env_step": 400000, "rew": 655.25, "rew_std": 164.68701375639793, "Agent": "qrdqn"}, {"env_step": 500000, "rew": 624.5, "rew_std": 130.56033088193365, "Agent": "qrdqn"}, {"env_step": 600000, "rew": 676.5, "rew_std": 131.37351331223505, "Agent": "qrdqn"}, {"env_step": 700000, "rew": 628.25, "rew_std": 158.0587311729409, "Agent": "qrdqn"}, {"env_step": 800000, "rew": 1161.25, "rew_std": 710.1436914456116, "Agent": "qrdqn"}, {"env_step": 900000, "rew": 1550.25, "rew_std": 826.7983808039297, "Agent": "qrdqn"}, {"env_step": 1000000, "rew": 1962.5, "rew_std": 961.0228925473108, "Agent": "qrdqn"}, {"env_step": 1100000, "rew": 2176.0, "rew_std": 1403.9837071704214, "Agent": "qrdqn"}, {"env_step": 1200000, "rew": 2638.5, "rew_std": 1025.882668729714, "Agent": "qrdqn"}, {"env_step": 1300000, "rew": 3701.0, "rew_std": 630.7289433663243, "Agent": "qrdqn"}, {"env_step": 1400000, "rew": 3190.25, "rew_std": 947.5115104841735, "Agent": "qrdqn"}, {"env_step": 1500000, "rew": 3946.75, "rew_std": 637.7578400145309, "Agent": "qrdqn"}, {"env_step": 1600000, "rew": 4426.5, "rew_std": 815.5735711755256, "Agent": "qrdqn"}, {"env_step": 1700000, "rew": 4326.25, "rew_std": 986.4046139896143, "Agent": "qrdqn"}, {"env_step": 1800000, "rew": 4494.5, "rew_std": 949.5484453149297, "Agent": "qrdqn"}, {"env_step": 1900000, "rew": 4857.5, "rew_std": 1134.8067016016428, "Agent": "qrdqn"}, {"env_step": 2000000, "rew": 4661.0, "rew_std": 2612.279225121235, "Agent": "qrdqn"}, {"env_step": 2100000, "rew": 6238.5, "rew_std": 2523.3789846156683, "Agent": "qrdqn"}, {"env_step": 2200000, "rew": 6793.5, "rew_std": 2207.1540499022717, "Agent": "qrdqn"}, {"env_step": 2300000, "rew": 8352.75, "rew_std": 2463.5217296585797, "Agent": "qrdqn"}, {"env_step": 2400000, "rew": 10017.0, "rew_std": 1099.753836092423, "Agent": "qrdqn"}, {"env_step": 2500000, "rew": 9378.25, "rew_std": 2206.291869291096, "Agent": "qrdqn"}, {"env_step": 2600000, "rew": 9277.75, "rew_std": 2164.6920826066694, "Agent": "qrdqn"}, {"env_step": 2700000, "rew": 9680.25, "rew_std": 1852.4255889238843, "Agent": "qrdqn"}, {"env_step": 2800000, "rew": 9750.0, "rew_std": 3101.0985956592867, "Agent": "qrdqn"}, {"env_step": 2900000, "rew": 11197.0, "rew_std": 2089.198650200598, "Agent": "qrdqn"}, {"env_step": 3000000, "rew": 10168.5, "rew_std": 1820.62976741566, "Agent": "qrdqn"}, {"env_step": 3100000, "rew": 10809.0, "rew_std": 1863.6564195151423, "Agent": "qrdqn"}, {"env_step": 3200000, "rew": 11434.75, "rew_std": 1928.14951767232, "Agent": "qrdqn"}, {"env_step": 3300000, "rew": 12635.0, "rew_std": 2041.877812211103, "Agent": "qrdqn"}, {"env_step": 3400000, "rew": 11676.0, "rew_std": 3368.622715591641, "Agent": "qrdqn"}, {"env_step": 3500000, "rew": 11960.0, "rew_std": 1950.4877595104256, "Agent": "qrdqn"}, {"env_step": 3600000, "rew": 11736.0, "rew_std": 2031.8129835198908, "Agent": "qrdqn"}, {"env_step": 3700000, "rew": 12507.25, "rew_std": 1577.2018141315968, "Agent": "qrdqn"}, {"env_step": 3800000, "rew": 12923.5, "rew_std": 4095.112208474879, "Agent": "qrdqn"}, {"env_step": 3900000, "rew": 13316.75, "rew_std": 1166.7872824555468, "Agent": "qrdqn"}, {"env_step": 4000000, "rew": 13060.0, "rew_std": 2080.1246957814815, "Agent": "qrdqn"}, {"env_step": 4100000, "rew": 12532.75, "rew_std": 1183.963919424912, "Agent": "qrdqn"}, {"env_step": 4200000, "rew": 12320.25, "rew_std": 2122.9921249265153, "Agent": "qrdqn"}, {"env_step": 4300000, "rew": 12833.5, "rew_std": 1463.2879074194525, "Agent": "qrdqn"}, {"env_step": 4400000, "rew": 12643.5, "rew_std": 1230.7717091321201, "Agent": "qrdqn"}, {"env_step": 4500000, "rew": 12753.5, "rew_std": 2467.2244526998347, "Agent": "qrdqn"}, {"env_step": 4600000, "rew": 14206.0, "rew_std": 934.261874422798, "Agent": "qrdqn"}, {"env_step": 4700000, "rew": 13566.0, "rew_std": 1616.8879058240248, "Agent": "qrdqn"}, {"env_step": 4800000, "rew": 13339.0, "rew_std": 2508.4644705476694, "Agent": "qrdqn"}, {"env_step": 4900000, "rew": 13325.5, "rew_std": 1697.8286868821601, "Agent": "qrdqn"}, {"env_step": 5000000, "rew": 13318.25, "rew_std": 1575.3479972691748, "Agent": "qrdqn"}, {"env_step": 5100000, "rew": 12695.25, "rew_std": 1818.0165875205869, "Agent": "qrdqn"}, {"env_step": 5200000, "rew": 13957.5, "rew_std": 1218.8980679285696, "Agent": "qrdqn"}, {"env_step": 5300000, "rew": 13959.75, "rew_std": 1010.0305997839868, "Agent": "qrdqn"}, {"env_step": 5400000, "rew": 13414.0, "rew_std": 1498.4079884997943, "Agent": "qrdqn"}, {"env_step": 5500000, "rew": 12775.5, "rew_std": 1296.2314608124584, "Agent": "qrdqn"}, {"env_step": 5600000, "rew": 14213.75, "rew_std": 1282.7033220897185, "Agent": "qrdqn"}, {"env_step": 5700000, "rew": 12620.5, "rew_std": 2257.2158735929534, "Agent": "qrdqn"}, {"env_step": 5800000, "rew": 12587.5, "rew_std": 1430.5497195134462, "Agent": "qrdqn"}, {"env_step": 5900000, "rew": 13289.5, "rew_std": 1792.5658286378216, "Agent": "qrdqn"}, {"env_step": 6000000, "rew": 13572.75, "rew_std": 2379.9851496385436, "Agent": "qrdqn"}, {"env_step": 6100000, "rew": 12327.75, "rew_std": 2985.5888133666363, "Agent": "qrdqn"}, {"env_step": 6200000, "rew": 13057.75, "rew_std": 2234.581182794664, "Agent": "qrdqn"}, {"env_step": 6300000, "rew": 13167.75, "rew_std": 2580.7533904850343, "Agent": "qrdqn"}, {"env_step": 6400000, "rew": 14265.0, "rew_std": 1022.666856801373, "Agent": "qrdqn"}, {"env_step": 6500000, "rew": 13314.5, "rew_std": 1621.0269892879637, "Agent": "qrdqn"}, {"env_step": 6600000, "rew": 14761.5, "rew_std": 862.8928091020344, "Agent": "qrdqn"}, {"env_step": 6700000, "rew": 12912.5, "rew_std": 2490.064005201473, "Agent": "qrdqn"}, {"env_step": 6800000, "rew": 13582.25, "rew_std": 1415.470085342675, "Agent": "qrdqn"}, {"env_step": 6900000, "rew": 14093.0, "rew_std": 1151.0564712471755, "Agent": "qrdqn"}, {"env_step": 7000000, "rew": 13608.75, "rew_std": 1454.381419195116, "Agent": "qrdqn"}, {"env_step": 7100000, "rew": 14457.25, "rew_std": 1426.2934699773396, "Agent": "qrdqn"}, {"env_step": 7200000, "rew": 14363.5, "rew_std": 1147.3579432766394, "Agent": "qrdqn"}, {"env_step": 7300000, "rew": 14335.75, "rew_std": 1048.029132467223, "Agent": "qrdqn"}, {"env_step": 7400000, "rew": 14255.0, "rew_std": 996.4361494847525, "Agent": "qrdqn"}, {"env_step": 7500000, "rew": 13165.0, "rew_std": 2007.4355531373853, "Agent": "qrdqn"}, {"env_step": 7600000, "rew": 13882.25, "rew_std": 1050.5673764685444, "Agent": "qrdqn"}, {"env_step": 7700000, "rew": 14029.25, "rew_std": 1288.9787866757156, "Agent": "qrdqn"}, {"env_step": 7800000, "rew": 13062.75, "rew_std": 2194.7472662017376, "Agent": "qrdqn"}, {"env_step": 7900000, "rew": 13878.75, "rew_std": 1196.7911524154915, "Agent": "qrdqn"}, {"env_step": 8000000, "rew": 14246.25, "rew_std": 1554.0568884374857, "Agent": "qrdqn"}, {"env_step": 8100000, "rew": 14211.5, "rew_std": 1194.981276003938, "Agent": "qrdqn"}, {"env_step": 8200000, "rew": 14197.0, "rew_std": 1123.807034147767, "Agent": "qrdqn"}, {"env_step": 8300000, "rew": 13508.0, "rew_std": 1345.116073058381, "Agent": "qrdqn"}, {"env_step": 8400000, "rew": 11739.5, "rew_std": 2172.110954808709, "Agent": "qrdqn"}, {"env_step": 8500000, "rew": 13295.5, "rew_std": 1875.5738455203516, "Agent": "qrdqn"}, {"env_step": 8600000, "rew": 14682.0, "rew_std": 657.4094994750228, "Agent": "qrdqn"}, {"env_step": 8700000, "rew": 13262.75, "rew_std": 2101.4068055709727, "Agent": "qrdqn"}, {"env_step": 8800000, "rew": 13034.25, "rew_std": 2962.464567298654, "Agent": "qrdqn"}, {"env_step": 8900000, "rew": 13833.25, "rew_std": 1593.2596500570771, "Agent": "qrdqn"}, {"env_step": 9000000, "rew": 13900.75, "rew_std": 1380.3591244672525, "Agent": "qrdqn"}, {"env_step": 9100000, "rew": 13849.5, "rew_std": 1837.9743605393412, "Agent": "qrdqn"}, {"env_step": 9200000, "rew": 12643.25, "rew_std": 2829.352631345199, "Agent": "qrdqn"}, {"env_step": 9300000, "rew": 13530.75, "rew_std": 1416.5393790855233, "Agent": "qrdqn"}, {"env_step": 9400000, "rew": 13982.5, "rew_std": 1845.6198145880423, "Agent": "qrdqn"}, {"env_step": 9500000, "rew": 13809.25, "rew_std": 1238.4738844642627, "Agent": "qrdqn"}, {"env_step": 9600000, "rew": 12931.5, "rew_std": 1797.4736437567033, "Agent": "qrdqn"}, {"env_step": 9700000, "rew": 14342.75, "rew_std": 649.1700951984773, "Agent": "qrdqn"}, {"env_step": 9800000, "rew": 14729.75, "rew_std": 626.4367984880837, "Agent": "qrdqn"}, {"env_step": 9900000, "rew": 13490.75, "rew_std": 1119.1950511416676, "Agent": "qrdqn"}, {"env_step": 10000000, "rew": 14191.5, "rew_std": 1683.4767595663445, "Agent": "qrdqn"}, {"env_step": 0, "rew": 74.75, "rew_std": 68.97871048374273, "Agent": "iqn"}, {"env_step": 100000, "rew": 305.25, "rew_std": 107.32223674523374, "Agent": "iqn"}, {"env_step": 200000, "rew": 278.5, "rew_std": 60.28266749240614, "Agent": "iqn"}, {"env_step": 300000, "rew": 480.75, "rew_std": 128.17980535170116, "Agent": "iqn"}, {"env_step": 400000, "rew": 580.5, "rew_std": 164.20566372692508, "Agent": "iqn"}, {"env_step": 500000, "rew": 603.5, "rew_std": 163.69254717304634, "Agent": "iqn"}, {"env_step": 600000, "rew": 681.5, "rew_std": 165.10299815569672, "Agent": "iqn"}, {"env_step": 700000, "rew": 779.5, "rew_std": 202.94642150084834, "Agent": "iqn"}, {"env_step": 800000, "rew": 1212.0, "rew_std": 518.2033867122059, "Agent": "iqn"}, {"env_step": 900000, "rew": 1937.0, "rew_std": 1077.2446333122296, "Agent": "iqn"}, {"env_step": 1000000, "rew": 2055.75, "rew_std": 1114.4051384034444, "Agent": "iqn"}, {"env_step": 1100000, "rew": 2164.0, "rew_std": 763.3292212407435, "Agent": "iqn"}, {"env_step": 1200000, "rew": 2717.0, "rew_std": 926.5607103692666, "Agent": "iqn"}, {"env_step": 1300000, "rew": 3349.25, "rew_std": 801.4120740917247, "Agent": "iqn"}, {"env_step": 1400000, "rew": 3172.25, "rew_std": 848.1453663730057, "Agent": "iqn"}, {"env_step": 1500000, "rew": 3463.5, "rew_std": 827.8875225536377, "Agent": "iqn"}, {"env_step": 1600000, "rew": 4035.75, "rew_std": 911.0859248720726, "Agent": "iqn"}, {"env_step": 1700000, "rew": 4497.0, "rew_std": 543.007596631944, "Agent": "iqn"}, {"env_step": 1800000, "rew": 4461.25, "rew_std": 499.12705045909905, "Agent": "iqn"}, {"env_step": 1900000, "rew": 4384.25, "rew_std": 471.4711682595236, "Agent": "iqn"}, {"env_step": 2000000, "rew": 5132.0, "rew_std": 1111.9947167140679, "Agent": "iqn"}, {"env_step": 2100000, "rew": 4575.75, "rew_std": 2275.0469912729277, "Agent": "iqn"}, {"env_step": 2200000, "rew": 5614.5, "rew_std": 1350.1304566596518, "Agent": "iqn"}, {"env_step": 2300000, "rew": 5378.75, "rew_std": 2386.0001178751018, "Agent": "iqn"}, {"env_step": 2400000, "rew": 6720.5, "rew_std": 2223.6897265580915, "Agent": "iqn"}, {"env_step": 2500000, "rew": 7193.75, "rew_std": 1491.2818521325873, "Agent": "iqn"}, {"env_step": 2600000, "rew": 8060.25, "rew_std": 2501.7125259509735, "Agent": "iqn"}, {"env_step": 2700000, "rew": 8047.0, "rew_std": 1672.755511125281, "Agent": "iqn"}, {"env_step": 2800000, "rew": 8176.0, "rew_std": 3218.092447397992, "Agent": "iqn"}, {"env_step": 2900000, "rew": 9079.25, "rew_std": 2817.5170917848927, "Agent": "iqn"}, {"env_step": 3000000, "rew": 9333.5, "rew_std": 1586.5446731813133, "Agent": "iqn"}, {"env_step": 3100000, "rew": 11244.75, "rew_std": 1804.940944324772, "Agent": "iqn"}, {"env_step": 3200000, "rew": 9774.75, "rew_std": 2385.623988079429, "Agent": "iqn"}, {"env_step": 3300000, "rew": 10427.5, "rew_std": 2821.736167681167, "Agent": "iqn"}, {"env_step": 3400000, "rew": 9773.25, "rew_std": 2530.4006723244443, "Agent": "iqn"}, {"env_step": 3500000, "rew": 10958.5, "rew_std": 1914.0373559572968, "Agent": "iqn"}, {"env_step": 3600000, "rew": 11481.25, "rew_std": 2320.765027420915, "Agent": "iqn"}, {"env_step": 3700000, "rew": 10402.0, "rew_std": 2840.605525235773, "Agent": "iqn"}, {"env_step": 3800000, "rew": 11571.25, "rew_std": 1838.5531845720427, "Agent": "iqn"}, {"env_step": 3900000, "rew": 12558.75, "rew_std": 1597.0246749815733, "Agent": "iqn"}, {"env_step": 4000000, "rew": 12249.5, "rew_std": 1836.1981102266716, "Agent": "iqn"}, {"env_step": 4100000, "rew": 12411.5, "rew_std": 1798.764228574718, "Agent": "iqn"}, {"env_step": 4200000, "rew": 12926.75, "rew_std": 1323.884459648953, "Agent": "iqn"}, {"env_step": 4300000, "rew": 11794.75, "rew_std": 2639.6958750015124, "Agent": "iqn"}, {"env_step": 4400000, "rew": 12201.0, "rew_std": 1702.2159087495334, "Agent": "iqn"}, {"env_step": 4500000, "rew": 12271.25, "rew_std": 1584.632548100663, "Agent": "iqn"}, {"env_step": 4600000, "rew": 12395.25, "rew_std": 1911.1424757196937, "Agent": "iqn"}, {"env_step": 4700000, "rew": 12780.0, "rew_std": 1188.934396844502, "Agent": "iqn"}, {"env_step": 4800000, "rew": 12680.5, "rew_std": 1798.4388368804762, "Agent": "iqn"}, {"env_step": 4900000, "rew": 11659.0, "rew_std": 1524.3105818697186, "Agent": "iqn"}, {"env_step": 5000000, "rew": 12834.25, "rew_std": 1934.9157119885094, "Agent": "iqn"}, {"env_step": 5100000, "rew": 13496.0, "rew_std": 1634.7783488901484, "Agent": "iqn"}, {"env_step": 5200000, "rew": 13142.75, "rew_std": 1530.6499640675527, "Agent": "iqn"}, {"env_step": 5300000, "rew": 12664.75, "rew_std": 2404.7719356521106, "Agent": "iqn"}, {"env_step": 5400000, "rew": 12944.25, "rew_std": 2205.103186361128, "Agent": "iqn"}, {"env_step": 5500000, "rew": 13810.25, "rew_std": 2059.245750875791, "Agent": "iqn"}, {"env_step": 5600000, "rew": 13504.0, "rew_std": 849.1313208214616, "Agent": "iqn"}, {"env_step": 5700000, "rew": 13502.25, "rew_std": 1435.742599667503, "Agent": "iqn"}, {"env_step": 5800000, "rew": 14175.25, "rew_std": 1070.7231493247916, "Agent": "iqn"}, {"env_step": 5900000, "rew": 13746.0, "rew_std": 1353.6211619208677, "Agent": "iqn"}, {"env_step": 6000000, "rew": 14359.75, "rew_std": 987.1046360442241, "Agent": "iqn"}, {"env_step": 6100000, "rew": 13638.25, "rew_std": 2135.9354069119227, "Agent": "iqn"}, {"env_step": 6200000, "rew": 14398.0, "rew_std": 724.5531381479208, "Agent": "iqn"}, {"env_step": 6300000, "rew": 13681.25, "rew_std": 1508.860600751441, "Agent": "iqn"}, {"env_step": 6400000, "rew": 12862.0, "rew_std": 2345.081501781974, "Agent": "iqn"}, {"env_step": 6500000, "rew": 12578.5, "rew_std": 3452.268855405094, "Agent": "iqn"}, {"env_step": 6600000, "rew": 13525.25, "rew_std": 1754.864115109771, "Agent": "iqn"}, {"env_step": 6700000, "rew": 14026.75, "rew_std": 1140.708688710663, "Agent": "iqn"}, {"env_step": 6800000, "rew": 14103.75, "rew_std": 1377.3363106010092, "Agent": "iqn"}, {"env_step": 6900000, "rew": 13723.5, "rew_std": 1402.6114928945933, "Agent": "iqn"}, {"env_step": 7000000, "rew": 13494.25, "rew_std": 997.4141880382492, "Agent": "iqn"}, {"env_step": 7100000, "rew": 14152.25, "rew_std": 709.2394253705867, "Agent": "iqn"}, {"env_step": 7200000, "rew": 13685.25, "rew_std": 1417.7761856160514, "Agent": "iqn"}, {"env_step": 7300000, "rew": 13408.25, "rew_std": 2077.5096419752185, "Agent": "iqn"}, {"env_step": 7400000, "rew": 14233.0, "rew_std": 909.7477672410084, "Agent": "iqn"}, {"env_step": 7500000, "rew": 14091.5, "rew_std": 743.8003764451857, "Agent": "iqn"}, {"env_step": 7600000, "rew": 13211.75, "rew_std": 1589.0996074821742, "Agent": "iqn"}, {"env_step": 7700000, "rew": 13444.5, "rew_std": 1892.1039215645635, "Agent": "iqn"}, {"env_step": 7800000, "rew": 13603.25, "rew_std": 2529.7435764322045, "Agent": "iqn"}, {"env_step": 7900000, "rew": 13292.25, "rew_std": 3160.3117824828614, "Agent": "iqn"}, {"env_step": 8000000, "rew": 14121.75, "rew_std": 818.3054518332382, "Agent": "iqn"}, {"env_step": 8100000, "rew": 14027.0, "rew_std": 721.3241296393737, "Agent": "iqn"}, {"env_step": 8200000, "rew": 14095.25, "rew_std": 599.5054732861078, "Agent": "iqn"}, {"env_step": 8300000, "rew": 14409.25, "rew_std": 808.6462839214684, "Agent": "iqn"}, {"env_step": 8400000, "rew": 13536.75, "rew_std": 753.1708388539747, "Agent": "iqn"}, {"env_step": 8500000, "rew": 13976.5, "rew_std": 988.6829623291786, "Agent": "iqn"}, {"env_step": 8600000, "rew": 13914.5, "rew_std": 1239.5683724587361, "Agent": "iqn"}, {"env_step": 8700000, "rew": 14257.0, "rew_std": 1150.6013645046662, "Agent": "iqn"}, {"env_step": 8800000, "rew": 13446.5, "rew_std": 1551.8111193054392, "Agent": "iqn"}, {"env_step": 8900000, "rew": 14032.5, "rew_std": 1186.8413963120768, "Agent": "iqn"}, {"env_step": 9000000, "rew": 14378.5, "rew_std": 943.7049326987753, "Agent": "iqn"}, {"env_step": 9100000, "rew": 14320.75, "rew_std": 647.3224177332344, "Agent": "iqn"}, {"env_step": 9200000, "rew": 13960.25, "rew_std": 1017.343630490701, "Agent": "iqn"}, {"env_step": 9300000, "rew": 13514.25, "rew_std": 1402.1367845185434, "Agent": "iqn"}, {"env_step": 9400000, "rew": 13712.25, "rew_std": 1607.3042065831844, "Agent": "iqn"}, {"env_step": 9500000, "rew": 14267.75, "rew_std": 724.1317645981289, "Agent": "iqn"}, {"env_step": 9600000, "rew": 14351.75, "rew_std": 780.0296869350551, "Agent": "iqn"}, {"env_step": 9700000, "rew": 13220.25, "rew_std": 1425.2001833075942, "Agent": "iqn"}, {"env_step": 9800000, "rew": 14156.5, "rew_std": 853.8107225843443, "Agent": "iqn"}, {"env_step": 9900000, "rew": 14273.75, "rew_std": 895.3443820675931, "Agent": "iqn"}, {"env_step": 10000000, "rew": 13774.75, "rew_std": 1513.8219223211163, "Agent": "iqn"}, {"env_step": 0, "rew": 45.5, "rew_std": 47.75981574503821, "Agent": "rainbow"}, {"env_step": 100000, "rew": 284.5, "rew_std": 61.47967143698801, "Agent": "rainbow"}, {"env_step": 200000, "rew": 285.0, "rew_std": 74.47314952383846, "Agent": "rainbow"}, {"env_step": 300000, "rew": 377.75, "rew_std": 92.13746523537534, "Agent": "rainbow"}, {"env_step": 400000, "rew": 395.75, "rew_std": 96.40442157909564, "Agent": "rainbow"}, {"env_step": 500000, "rew": 446.5, "rew_std": 135.95587519485872, "Agent": "rainbow"}, {"env_step": 600000, "rew": 509.0, "rew_std": 112.18400064180275, "Agent": "rainbow"}, {"env_step": 700000, "rew": 842.0, "rew_std": 379.03957577012983, "Agent": "rainbow"}, {"env_step": 800000, "rew": 841.25, "rew_std": 334.61031439571616, "Agent": "rainbow"}, {"env_step": 900000, "rew": 1965.0, "rew_std": 1128.5698914998575, "Agent": "rainbow"}, {"env_step": 1000000, "rew": 2198.25, "rew_std": 836.4859906178943, "Agent": "rainbow"}, {"env_step": 1100000, "rew": 3015.75, "rew_std": 848.7866707836546, "Agent": "rainbow"}, {"env_step": 1200000, "rew": 2877.0, "rew_std": 996.3312702108672, "Agent": "rainbow"}, {"env_step": 1300000, "rew": 3242.0, "rew_std": 876.3666470148211, "Agent": "rainbow"}, {"env_step": 1400000, "rew": 3739.5, "rew_std": 779.8091112573641, "Agent": "rainbow"}, {"env_step": 1500000, "rew": 3878.5, "rew_std": 610.4621200369438, "Agent": "rainbow"}, {"env_step": 1600000, "rew": 3686.75, "rew_std": 1020.1911891895558, "Agent": "rainbow"}, {"env_step": 1700000, "rew": 3802.5, "rew_std": 775.4450335130144, "Agent": "rainbow"}, {"env_step": 1800000, "rew": 4826.75, "rew_std": 1208.2508276430024, "Agent": "rainbow"}, {"env_step": 1900000, "rew": 5678.25, "rew_std": 1521.4220527191, "Agent": "rainbow"}, {"env_step": 2000000, "rew": 5642.5, "rew_std": 2018.9904655545058, "Agent": "rainbow"}, {"env_step": 2100000, "rew": 7018.0, "rew_std": 2637.9750283124363, "Agent": "rainbow"}, {"env_step": 2200000, "rew": 6920.25, "rew_std": 1881.316178237991, "Agent": "rainbow"}, {"env_step": 2300000, "rew": 7435.0, "rew_std": 1537.6528379318916, "Agent": "rainbow"}, {"env_step": 2400000, "rew": 7692.5, "rew_std": 1343.7070923382075, "Agent": "rainbow"}, {"env_step": 2500000, "rew": 8006.25, "rew_std": 1876.4488568836616, "Agent": "rainbow"}, {"env_step": 2600000, "rew": 9979.75, "rew_std": 2021.7954427933603, "Agent": "rainbow"}, {"env_step": 2700000, "rew": 9089.75, "rew_std": 1605.1473647301048, "Agent": "rainbow"}, {"env_step": 2800000, "rew": 8764.75, "rew_std": 1827.6663569973596, "Agent": "rainbow"}, {"env_step": 2900000, "rew": 9663.0, "rew_std": 2015.3541252097607, "Agent": "rainbow"}, {"env_step": 3000000, "rew": 9934.5, "rew_std": 2286.617261371041, "Agent": "rainbow"}, {"env_step": 3100000, "rew": 10924.25, "rew_std": 2628.7715881186787, "Agent": "rainbow"}, {"env_step": 3200000, "rew": 9174.75, "rew_std": 1997.3590219337134, "Agent": "rainbow"}, {"env_step": 3300000, "rew": 10324.25, "rew_std": 1182.9740328933683, "Agent": "rainbow"}, {"env_step": 3400000, "rew": 10506.5, "rew_std": 1664.2221155843351, "Agent": "rainbow"}, {"env_step": 3500000, "rew": 10675.0, "rew_std": 2079.8194032175006, "Agent": "rainbow"}, {"env_step": 3600000, "rew": 10794.25, "rew_std": 2335.775848085599, "Agent": "rainbow"}, {"env_step": 3700000, "rew": 10830.25, "rew_std": 2143.70282746933, "Agent": "rainbow"}, {"env_step": 3800000, "rew": 11664.75, "rew_std": 1526.7708775386043, "Agent": "rainbow"}, {"env_step": 3900000, "rew": 10242.5, "rew_std": 2334.839662589275, "Agent": "rainbow"}, {"env_step": 4000000, "rew": 11877.25, "rew_std": 1986.8088263594966, "Agent": "rainbow"}, {"env_step": 4100000, "rew": 11280.25, "rew_std": 2765.102721871287, "Agent": "rainbow"}, {"env_step": 4200000, "rew": 12994.5, "rew_std": 1754.1610530393154, "Agent": "rainbow"}, {"env_step": 4300000, "rew": 10860.25, "rew_std": 1974.6045331913933, "Agent": "rainbow"}, {"env_step": 4400000, "rew": 10636.25, "rew_std": 2674.058537597859, "Agent": "rainbow"}, {"env_step": 4500000, "rew": 12535.5, "rew_std": 1929.7117012652434, "Agent": "rainbow"}, {"env_step": 4600000, "rew": 12290.5, "rew_std": 1829.934015203827, "Agent": "rainbow"}, {"env_step": 4700000, "rew": 12177.5, "rew_std": 946.7675269040442, "Agent": "rainbow"}, {"env_step": 4800000, "rew": 13175.75, "rew_std": 1413.9178945398492, "Agent": "rainbow"}, {"env_step": 4900000, "rew": 12883.5, "rew_std": 1610.216677966043, "Agent": "rainbow"}, {"env_step": 5000000, "rew": 12284.5, "rew_std": 1809.4221453270654, "Agent": "rainbow"}, {"env_step": 5100000, "rew": 12318.0, "rew_std": 2168.0633062712905, "Agent": "rainbow"}, {"env_step": 5200000, "rew": 12730.25, "rew_std": 1575.0005753967203, "Agent": "rainbow"}, {"env_step": 5300000, "rew": 11980.25, "rew_std": 1916.1492798057254, "Agent": "rainbow"}, {"env_step": 5400000, "rew": 12032.75, "rew_std": 2195.3403637021756, "Agent": "rainbow"}, {"env_step": 5500000, "rew": 12618.0, "rew_std": 2118.3926099757805, "Agent": "rainbow"}, {"env_step": 5600000, "rew": 13014.25, "rew_std": 1486.7145195026515, "Agent": "rainbow"}, {"env_step": 5700000, "rew": 12690.0, "rew_std": 1458.9743829142444, "Agent": "rainbow"}, {"env_step": 5800000, "rew": 12033.5, "rew_std": 1977.8407418192194, "Agent": "rainbow"}, {"env_step": 5900000, "rew": 12640.25, "rew_std": 2624.1961745456456, "Agent": "rainbow"}, {"env_step": 6000000, "rew": 13131.25, "rew_std": 1906.204097807997, "Agent": "rainbow"}, {"env_step": 6100000, "rew": 13501.75, "rew_std": 1226.5200008560805, "Agent": "rainbow"}, {"env_step": 6200000, "rew": 13880.0, "rew_std": 1096.272662251504, "Agent": "rainbow"}, {"env_step": 6300000, "rew": 12978.75, "rew_std": 1734.9788363262533, "Agent": "rainbow"}, {"env_step": 6400000, "rew": 12417.0, "rew_std": 1276.8250663266288, "Agent": "rainbow"}, {"env_step": 6500000, "rew": 13424.5, "rew_std": 1740.133543725883, "Agent": "rainbow"}, {"env_step": 6600000, "rew": 13237.0, "rew_std": 1644.9296337533713, "Agent": "rainbow"}, {"env_step": 6700000, "rew": 13351.75, "rew_std": 1120.8969901378093, "Agent": "rainbow"}, {"env_step": 6800000, "rew": 12263.0, "rew_std": 2282.7893573433357, "Agent": "rainbow"}, {"env_step": 6900000, "rew": 12439.0, "rew_std": 2598.2990108915487, "Agent": "rainbow"}, {"env_step": 7000000, "rew": 14034.5, "rew_std": 744.4837137238128, "Agent": "rainbow"}, {"env_step": 7100000, "rew": 13683.25, "rew_std": 901.8238810876545, "Agent": "rainbow"}, {"env_step": 7200000, "rew": 14111.25, "rew_std": 1060.766379793402, "Agent": "rainbow"}, {"env_step": 7300000, "rew": 13421.75, "rew_std": 1568.2095881928537, "Agent": "rainbow"}, {"env_step": 7400000, "rew": 14206.5, "rew_std": 607.6617068731582, "Agent": "rainbow"}, {"env_step": 7500000, "rew": 13354.25, "rew_std": 1601.6690708445362, "Agent": "rainbow"}, {"env_step": 7600000, "rew": 13701.75, "rew_std": 1030.2663793893305, "Agent": "rainbow"}, {"env_step": 7700000, "rew": 13039.0, "rew_std": 2426.61317477673, "Agent": "rainbow"}, {"env_step": 7800000, "rew": 13988.25, "rew_std": 1832.0964937742772, "Agent": "rainbow"}, {"env_step": 7900000, "rew": 13303.0, "rew_std": 1248.9764809635128, "Agent": "rainbow"}, {"env_step": 8000000, "rew": 13551.25, "rew_std": 1319.6809510256637, "Agent": "rainbow"}, {"env_step": 8100000, "rew": 13257.25, "rew_std": 1674.4097654098891, "Agent": "rainbow"}, {"env_step": 8200000, "rew": 13652.5, "rew_std": 1983.858613913804, "Agent": "rainbow"}, {"env_step": 8300000, "rew": 13802.5, "rew_std": 1365.1304882684292, "Agent": "rainbow"}, {"env_step": 8400000, "rew": 13834.5, "rew_std": 1055.2753195256678, "Agent": "rainbow"}, {"env_step": 8500000, "rew": 14132.75, "rew_std": 759.6795788357089, "Agent": "rainbow"}, {"env_step": 8600000, "rew": 13816.5, "rew_std": 838.3877384599563, "Agent": "rainbow"}, {"env_step": 8700000, "rew": 13764.0, "rew_std": 1449.42367857021, "Agent": "rainbow"}, {"env_step": 8800000, "rew": 13053.75, "rew_std": 1003.1601629351118, "Agent": "rainbow"}, {"env_step": 8900000, "rew": 13302.75, "rew_std": 1787.7211226866455, "Agent": "rainbow"}, {"env_step": 9000000, "rew": 13252.75, "rew_std": 1108.8256456720326, "Agent": "rainbow"}, {"env_step": 9100000, "rew": 13711.75, "rew_std": 1272.3845969281458, "Agent": "rainbow"}, {"env_step": 9200000, "rew": 13983.5, "rew_std": 1598.7660085203213, "Agent": "rainbow"}, {"env_step": 9300000, "rew": 13033.25, "rew_std": 1330.3514808124958, "Agent": "rainbow"}, {"env_step": 9400000, "rew": 14224.75, "rew_std": 1230.1089636694792, "Agent": "rainbow"}, {"env_step": 9500000, "rew": 13983.25, "rew_std": 1469.7389436563217, "Agent": "rainbow"}, {"env_step": 9600000, "rew": 12979.5, "rew_std": 1610.91891478125, "Agent": "rainbow"}, {"env_step": 9700000, "rew": 13711.25, "rew_std": 1179.091413970944, "Agent": "rainbow"}, {"env_step": 9800000, "rew": 13414.0, "rew_std": 2159.0412223947924, "Agent": "rainbow"}, {"env_step": 9900000, "rew": 13838.75, "rew_std": 1349.4764030912138, "Agent": "rainbow"}, {"env_step": 10000000, "rew": 14035.0, "rew_std": 1246.866572653225, "Agent": "rainbow"}, {"env_step": 0, "rew": 120.5, "rew_std": 101.5, "Agent": "ppo"}, {"env_step": 100000, "rew": 273.0, "rew_std": 28.956864471140516, "Agent": "ppo"}, {"env_step": 200000, "rew": 355.0, "rew_std": 89.81230427953622, "Agent": "ppo"}, {"env_step": 300000, "rew": 391.5, "rew_std": 92.91931984253867, "Agent": "ppo"}, {"env_step": 400000, "rew": 474.0, "rew_std": 108.15035829806575, "Agent": "ppo"}, {"env_step": 500000, "rew": 542.75, "rew_std": 105.84452040611266, "Agent": "ppo"}, {"env_step": 600000, "rew": 621.75, "rew_std": 77.6695725493581, "Agent": "ppo"}, {"env_step": 700000, "rew": 641.75, "rew_std": 85.77623505377233, "Agent": "ppo"}, {"env_step": 800000, "rew": 672.25, "rew_std": 64.53148456373835, "Agent": "ppo"}, {"env_step": 900000, "rew": 744.75, "rew_std": 134.25465541276398, "Agent": "ppo"}, {"env_step": 1000000, "rew": 791.25, "rew_std": 143.7891251103504, "Agent": "ppo"}, {"env_step": 1100000, "rew": 995.0, "rew_std": 389.2460661329797, "Agent": "ppo"}, {"env_step": 1200000, "rew": 817.25, "rew_std": 168.63588734311568, "Agent": "ppo"}, {"env_step": 1300000, "rew": 1099.0, "rew_std": 655.2797112684018, "Agent": "ppo"}, {"env_step": 1400000, "rew": 1188.0, "rew_std": 663.5, "Agent": "ppo"}, {"env_step": 1500000, "rew": 1322.0, "rew_std": 450.0927682156202, "Agent": "ppo"}, {"env_step": 1600000, "rew": 1452.75, "rew_std": 704.6368302182337, "Agent": "ppo"}, {"env_step": 1700000, "rew": 1558.5, "rew_std": 423.40170051618827, "Agent": "ppo"}, {"env_step": 1800000, "rew": 1552.75, "rew_std": 663.306537356598, "Agent": "ppo"}, {"env_step": 1900000, "rew": 1814.25, "rew_std": 756.1093257591788, "Agent": "ppo"}, {"env_step": 2000000, "rew": 1824.0, "rew_std": 703.5785315087435, "Agent": "ppo"}, {"env_step": 2100000, "rew": 1752.25, "rew_std": 750.6567541160207, "Agent": "ppo"}, {"env_step": 2200000, "rew": 2510.75, "rew_std": 872.3481601402045, "Agent": "ppo"}, {"env_step": 2300000, "rew": 2298.25, "rew_std": 906.4326022931876, "Agent": "ppo"}, {"env_step": 2400000, "rew": 2231.0, "rew_std": 897.2521942018309, "Agent": "ppo"}, {"env_step": 2500000, "rew": 2028.0, "rew_std": 938.4780231843471, "Agent": "ppo"}, {"env_step": 2600000, "rew": 2503.25, "rew_std": 949.5203065232465, "Agent": "ppo"}, {"env_step": 2700000, "rew": 2804.5, "rew_std": 959.1681291619317, "Agent": "ppo"}, {"env_step": 2800000, "rew": 2946.25, "rew_std": 708.6265324555665, "Agent": "ppo"}, {"env_step": 2900000, "rew": 3231.75, "rew_std": 616.26298160769, "Agent": "ppo"}, {"env_step": 3000000, "rew": 2883.25, "rew_std": 727.0738012746712, "Agent": "ppo"}, {"env_step": 3100000, "rew": 3300.5, "rew_std": 795.6183130119617, "Agent": "ppo"}, {"env_step": 3200000, "rew": 3390.5, "rew_std": 828.5211222413102, "Agent": "ppo"}, {"env_step": 3300000, "rew": 3235.5, "rew_std": 996.1192197724126, "Agent": "ppo"}, {"env_step": 3400000, "rew": 3114.0, "rew_std": 1074.6076028020648, "Agent": "ppo"}, {"env_step": 3500000, "rew": 3412.75, "rew_std": 1089.8081539885816, "Agent": "ppo"}, {"env_step": 3600000, "rew": 3153.75, "rew_std": 1106.7566636347847, "Agent": "ppo"}, {"env_step": 3700000, "rew": 3294.75, "rew_std": 694.6846856668138, "Agent": "ppo"}, {"env_step": 3800000, "rew": 3217.0, "rew_std": 1153.753548206895, "Agent": "ppo"}, {"env_step": 3900000, "rew": 3735.5, "rew_std": 868.4992803681532, "Agent": "ppo"}, {"env_step": 4000000, "rew": 3744.0, "rew_std": 798.573885122723, "Agent": "ppo"}, {"env_step": 4100000, "rew": 3626.75, "rew_std": 879.9460565852886, "Agent": "ppo"}, {"env_step": 4200000, "rew": 3621.5, "rew_std": 977.4035758068414, "Agent": "ppo"}, {"env_step": 4300000, "rew": 3884.5, "rew_std": 623.5030072100695, "Agent": "ppo"}, {"env_step": 4400000, "rew": 3692.25, "rew_std": 711.3521016346265, "Agent": "ppo"}, {"env_step": 4500000, "rew": 3992.75, "rew_std": 715.286175247362, "Agent": "ppo"}, {"env_step": 4600000, "rew": 4163.0, "rew_std": 830.2919667201412, "Agent": "ppo"}, {"env_step": 4700000, "rew": 4100.75, "rew_std": 683.023654422012, "Agent": "ppo"}, {"env_step": 4800000, "rew": 4077.5, "rew_std": 490.6844709179209, "Agent": "ppo"}, {"env_step": 4900000, "rew": 4007.25, "rew_std": 496.95126773155533, "Agent": "ppo"}, {"env_step": 5000000, "rew": 4787.5, "rew_std": 1021.3936557468918, "Agent": "ppo"}, {"env_step": 5100000, "rew": 4553.0, "rew_std": 615.2263810988602, "Agent": "ppo"}, {"env_step": 5200000, "rew": 4548.75, "rew_std": 416.08029573629176, "Agent": "ppo"}, {"env_step": 5300000, "rew": 4595.0, "rew_std": 509.9178855462907, "Agent": "ppo"}, {"env_step": 5400000, "rew": 5037.5, "rew_std": 584.2281232532374, "Agent": "ppo"}, {"env_step": 5500000, "rew": 5001.75, "rew_std": 1064.1552107188124, "Agent": "ppo"}, {"env_step": 5600000, "rew": 5132.75, "rew_std": 1378.285370487549, "Agent": "ppo"}, {"env_step": 5700000, "rew": 5175.5, "rew_std": 1010.7384676561984, "Agent": "ppo"}, {"env_step": 5800000, "rew": 4833.5, "rew_std": 789.5474969879899, "Agent": "ppo"}, {"env_step": 5900000, "rew": 5724.0, "rew_std": 707.8031152799484, "Agent": "ppo"}, {"env_step": 6000000, "rew": 6142.5, "rew_std": 1675.208569104158, "Agent": "ppo"}, {"env_step": 6100000, "rew": 6317.0, "rew_std": 1503.244324785562, "Agent": "ppo"}, {"env_step": 6200000, "rew": 6381.75, "rew_std": 1400.6998473977214, "Agent": "ppo"}, {"env_step": 6300000, "rew": 6283.0, "rew_std": 1507.1785726980065, "Agent": "ppo"}, {"env_step": 6400000, "rew": 6748.0, "rew_std": 1430.778983630945, "Agent": "ppo"}, {"env_step": 6500000, "rew": 7201.75, "rew_std": 1294.4265380854952, "Agent": "ppo"}, {"env_step": 6600000, "rew": 6559.0, "rew_std": 1157.9767916499882, "Agent": "ppo"}, {"env_step": 6700000, "rew": 7433.5, "rew_std": 1716.4509896877335, "Agent": "ppo"}, {"env_step": 6800000, "rew": 7610.5, "rew_std": 1812.574412265604, "Agent": "ppo"}, {"env_step": 6900000, "rew": 8195.0, "rew_std": 1976.1841386874858, "Agent": "ppo"}, {"env_step": 7000000, "rew": 8271.5, "rew_std": 1789.7011622055788, "Agent": "ppo"}, {"env_step": 7100000, "rew": 7825.5, "rew_std": 1272.6767067877058, "Agent": "ppo"}, {"env_step": 7200000, "rew": 8352.75, "rew_std": 1310.4419340436264, "Agent": "ppo"}, {"env_step": 7300000, "rew": 8443.0, "rew_std": 1754.0131841009634, "Agent": "ppo"}, {"env_step": 7400000, "rew": 8361.25, "rew_std": 1613.0232678111001, "Agent": "ppo"}, {"env_step": 7500000, "rew": 8785.5, "rew_std": 1928.0082987373264, "Agent": "ppo"}, {"env_step": 7600000, "rew": 9088.0, "rew_std": 1135.7738551313814, "Agent": "ppo"}, {"env_step": 7700000, "rew": 8585.25, "rew_std": 1348.3320483100592, "Agent": "ppo"}, {"env_step": 7800000, "rew": 8759.25, "rew_std": 1379.0055520192802, "Agent": "ppo"}, {"env_step": 7900000, "rew": 9218.5, "rew_std": 1970.6262329523577, "Agent": "ppo"}, {"env_step": 8000000, "rew": 9573.25, "rew_std": 1635.5530601298144, "Agent": "ppo"}, {"env_step": 8100000, "rew": 10431.25, "rew_std": 1564.9469839262927, "Agent": "ppo"}, {"env_step": 8200000, "rew": 9307.5, "rew_std": 1389.4486316521384, "Agent": "ppo"}, {"env_step": 8300000, "rew": 9908.75, "rew_std": 1632.5357002222033, "Agent": "ppo"}, {"env_step": 8400000, "rew": 10750.5, "rew_std": 2245.378531562106, "Agent": "ppo"}, {"env_step": 8500000, "rew": 10358.5, "rew_std": 2260.2992611599025, "Agent": "ppo"}, {"env_step": 8600000, "rew": 10700.25, "rew_std": 1594.5439982954374, "Agent": "ppo"}, {"env_step": 8700000, "rew": 10038.25, "rew_std": 1889.7635599460584, "Agent": "ppo"}, {"env_step": 8800000, "rew": 9823.0, "rew_std": 1878.6184418343178, "Agent": "ppo"}, {"env_step": 8900000, "rew": 10836.5, "rew_std": 1715.2179890614486, "Agent": "ppo"}, {"env_step": 9000000, "rew": 10589.0, "rew_std": 1656.9747282321478, "Agent": "ppo"}, {"env_step": 9100000, "rew": 10209.75, "rew_std": 1596.2845336906576, "Agent": "ppo"}, {"env_step": 9200000, "rew": 11638.75, "rew_std": 2334.8370526655603, "Agent": "ppo"}, {"env_step": 9300000, "rew": 11236.5, "rew_std": 1308.257046608196, "Agent": "ppo"}, {"env_step": 9400000, "rew": 12341.75, "rew_std": 1760.6944830094742, "Agent": "ppo"}, {"env_step": 9500000, "rew": 11866.0, "rew_std": 1635.246617486182, "Agent": "ppo"}, {"env_step": 9600000, "rew": 11265.5, "rew_std": 1304.1528859761804, "Agent": "ppo"}, {"env_step": 9700000, "rew": 11678.5, "rew_std": 1495.5292541438298, "Agent": "ppo"}, {"env_step": 9800000, "rew": 11504.25, "rew_std": 1666.65422703691, "Agent": "ppo"}, {"env_step": 9900000, "rew": 11494.0, "rew_std": 1494.6768881601133, "Agent": "ppo"}, {"env_step": 10000000, "rew": 12188.5, "rew_std": 1292.4967117946567, "Agent": "ppo"}]