[{"env_step": 0, "rew": 0.0800000011920929, "rew_std": 0.24000000357627865, "Agent": "c51"}, {"env_step": 100000, "rew": 0.0, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 200000, "rew": 0.0, "rew_std": 0.0, "Agent": "c51"}, {"env_step": 300000, "rew": 0.1, "rew_std": 0.30000000000000004, "Agent": "c51"}, {"env_step": 400000, "rew": 0.21000000238418579, "rew_std": 0.35623026856774925, "Agent": "c51"}, {"env_step": 500000, "rew": 0.05000000074505806, "rew_std": 0.12041594758226036, "Agent": "c51"}, {"env_step": 600000, "rew": 0.31999999061226847, "rew_std": 0.927146130289149, "Agent": "c51"}, {"env_step": 700000, "rew": 0.7299999989569187, "rew_std": 1.0354226172474177, "Agent": "c51"}, {"env_step": 800000, "rew": 29.999999809265137, "rew_std": 22.8517390602112, "Agent": "c51"}, {"env_step": 900000, "rew": 84.33000020980835, "rew_std": 38.11215200504169, "Agent": "c51"}, {"env_step": 1000000, "rew": 134.27000045776367, "rew_std": 33.76175580023914, "Agent": "c51"}, {"env_step": 1100000, "rew": 195.3500015258789, "rew_std": 55.070539310018276, "Agent": "c51"}, {"env_step": 1200000, "rew": 305.8000015258789, "rew_std": 63.623845163113806, "Agent": "c51"}, {"env_step": 1300000, "rew": 341.6900039672852, "rew_std": 75.15398169731095, "Agent": "c51"}, {"env_step": 1400000, "rew": 439.62000427246096, "rew_std": 35.53360923105612, "Agent": "c51"}, {"env_step": 1500000, "rew": 448.17999877929685, "rew_std": 63.31653151381171, "Agent": "c51"}, {"env_step": 1600000, "rew": 483.0900024414062, "rew_std": 63.598508175034475, "Agent": "c51"}, {"env_step": 1700000, "rew": 479.4499938964844, "rew_std": 60.719817637295435, "Agent": "c51"}, {"env_step": 1800000, "rew": 477.8299987792969, "rew_std": 88.50112258719895, "Agent": "c51"}, {"env_step": 1900000, "rew": 516.6200012207031, "rew_std": 90.65022983110897, "Agent": "c51"}, {"env_step": 2000000, "rew": 500.8199981689453, "rew_std": 56.8060386594065, "Agent": "c51"}, {"env_step": 2100000, "rew": 539.5200012207031, "rew_std": 80.30648599564611, "Agent": "c51"}, {"env_step": 2200000, "rew": 592.730014038086, "rew_std": 96.93099005249192, "Agent": "c51"}, {"env_step": 2300000, "rew": 573.3399963378906, "rew_std": 91.49156422648889, "Agent": "c51"}, {"env_step": 2400000, "rew": 606.1099975585937, "rew_std": 68.63315724977679, "Agent": "c51"}, {"env_step": 2500000, "rew": 652.9599975585937, "rew_std": 85.58606896755197, "Agent": "c51"}, {"env_step": 2600000, "rew": 655.4, "rew_std": 81.90140506345105, "Agent": "c51"}, {"env_step": 2700000, "rew": 625.2999969482422, "rew_std": 85.18681205945472, "Agent": "c51"}, {"env_step": 2800000, "rew": 637.7900024414063, "rew_std": 122.54666760609061, "Agent": "c51"}, {"env_step": 2900000, "rew": 644.1, "rew_std": 85.42630507564513, "Agent": "c51"}, {"env_step": 3000000, "rew": 710.5900024414062, "rew_std": 75.28909772977295, "Agent": "c51"}, {"env_step": 3100000, "rew": 671.3799987792969, "rew_std": 56.7536538058374, "Agent": "c51"}, {"env_step": 3200000, "rew": 668.2599975585938, "rew_std": 65.81738352088684, "Agent": "c51"}, {"env_step": 3300000, "rew": 690.7899993896484, "rew_std": 84.55681861003309, "Agent": "c51"}, {"env_step": 3400000, "rew": 738.3400024414062, "rew_std": 101.42283074745313, "Agent": "c51"}, {"env_step": 3500000, "rew": 730.4300048828125, "rew_std": 90.93792521834833, "Agent": "c51"}, {"env_step": 3600000, "rew": 742.3700012207031, "rew_std": 98.71111614905327, "Agent": "c51"}, {"env_step": 3700000, "rew": 708.8199981689453, "rew_std": 130.55409140026177, "Agent": "c51"}, {"env_step": 3800000, "rew": 705.9700012207031, "rew_std": 75.86588955018891, "Agent": "c51"}, {"env_step": 3900000, "rew": 755.3899963378906, "rew_std": 111.82682749974384, "Agent": "c51"}, {"env_step": 4000000, "rew": 792.8599975585937, "rew_std": 100.65659388596904, "Agent": "c51"}, {"env_step": 4100000, "rew": 780.4700012207031, "rew_std": 89.4066144108773, "Agent": "c51"}, {"env_step": 4200000, "rew": 749.0600036621094, "rew_std": 89.14610115546856, "Agent": "c51"}, {"env_step": 4300000, "rew": 735.3100067138672, "rew_std": 105.2854315881353, "Agent": "c51"}, {"env_step": 4400000, "rew": 794.9, "rew_std": 94.90966229691644, "Agent": "c51"}, {"env_step": 4500000, "rew": 775.8700012207031, "rew_std": 86.57670898287867, "Agent": "c51"}, {"env_step": 4600000, "rew": 764.4599975585937, "rew_std": 121.75587907672723, "Agent": "c51"}, {"env_step": 4700000, "rew": 761.55, "rew_std": 62.056058351897406, "Agent": "c51"}, {"env_step": 4800000, "rew": 746.5799987792968, "rew_std": 130.65757158616265, "Agent": "c51"}, {"env_step": 4900000, "rew": 792.0400085449219, "rew_std": 92.14410963183664, "Agent": "c51"}, {"env_step": 5000000, "rew": 784.8700012207031, "rew_std": 76.30846325078628, "Agent": "c51"}, {"env_step": 5100000, "rew": 806.9400024414062, "rew_std": 89.7122211065443, "Agent": "c51"}, {"env_step": 5200000, "rew": 809.7999938964844, "rew_std": 96.43909531778648, "Agent": "c51"}, {"env_step": 5300000, "rew": 801.8500061035156, "rew_std": 71.23311713783924, "Agent": "c51"}, {"env_step": 5400000, "rew": 865.3399963378906, "rew_std": 87.65904211044649, "Agent": "c51"}, {"env_step": 5500000, "rew": 800.1799987792969, "rew_std": 120.17872453215695, "Agent": "c51"}, {"env_step": 5600000, "rew": 808.1899963378906, "rew_std": 114.39077140355394, "Agent": "c51"}, {"env_step": 5700000, "rew": 787.6900024414062, "rew_std": 137.37429836391115, "Agent": "c51"}, {"env_step": 5800000, "rew": 817.6800048828125, "rew_std": 75.91765398683945, "Agent": "c51"}, {"env_step": 5900000, "rew": 788.95, "rew_std": 112.15058353811531, "Agent": "c51"}, {"env_step": 6000000, "rew": 824.4900024414062, "rew_std": 83.1460697372063, "Agent": "c51"}, {"env_step": 6100000, "rew": 791.3400024414062, "rew_std": 71.07509644467352, "Agent": "c51"}, {"env_step": 6200000, "rew": 852.5599975585938, "rew_std": 102.26750645543113, "Agent": "c51"}, {"env_step": 6300000, "rew": 791.0799957275391, "rew_std": 148.64477463928537, "Agent": "c51"}, {"env_step": 6400000, "rew": 799.7700012207031, "rew_std": 94.79903258127105, "Agent": "c51"}, {"env_step": 6500000, "rew": 856.9799987792969, "rew_std": 98.21994199980757, "Agent": "c51"}, {"env_step": 6600000, "rew": 830.3799987792969, "rew_std": 92.69931723386792, "Agent": "c51"}, {"env_step": 6700000, "rew": 828.5700012207031, "rew_std": 117.4840294040638, "Agent": "c51"}, {"env_step": 6800000, "rew": 836.3399963378906, "rew_std": 107.67462291584121, "Agent": "c51"}, {"env_step": 6900000, "rew": 809.05, "rew_std": 86.39843789136866, "Agent": "c51"}, {"env_step": 7000000, "rew": 802.610009765625, "rew_std": 85.19054082178417, "Agent": "c51"}, {"env_step": 7100000, "rew": 821.9500061035156, "rew_std": 84.06559770155239, "Agent": "c51"}, {"env_step": 7200000, "rew": 846.0100036621094, "rew_std": 109.6511176842256, "Agent": "c51"}, {"env_step": 7300000, "rew": 753.2699981689453, "rew_std": 118.18144461063531, "Agent": "c51"}, {"env_step": 7400000, "rew": 862.4699951171875, "rew_std": 94.61919535944561, "Agent": "c51"}, {"env_step": 7500000, "rew": 855.6, "rew_std": 83.0109175169287, "Agent": "c51"}, {"env_step": 7600000, "rew": 804.8099975585938, "rew_std": 87.84749020213859, "Agent": "c51"}, {"env_step": 7700000, "rew": 879.1099975585937, "rew_std": 124.99047443353965, "Agent": "c51"}, {"env_step": 7800000, "rew": 861.0999938964844, "rew_std": 149.99051826966058, "Agent": "c51"}, {"env_step": 7900000, "rew": 840.1100158691406, "rew_std": 74.45142853212236, "Agent": "c51"}, {"env_step": 8000000, "rew": 838.1, "rew_std": 81.488879742754, "Agent": "c51"}, {"env_step": 8100000, "rew": 853.1600036621094, "rew_std": 125.11934723061991, "Agent": "c51"}, {"env_step": 8200000, "rew": 883.8700012207031, "rew_std": 110.8634912939346, "Agent": "c51"}, {"env_step": 8300000, "rew": 843.6199951171875, "rew_std": 110.07341220660334, "Agent": "c51"}, {"env_step": 8400000, "rew": 833.9500122070312, "rew_std": 166.85491541704317, "Agent": "c51"}, {"env_step": 8500000, "rew": 883.5900085449218, "rew_std": 120.01639086371644, "Agent": "c51"}, {"env_step": 8600000, "rew": 816.3799987792969, "rew_std": 93.30947260374052, "Agent": "c51"}, {"env_step": 8700000, "rew": 816.5599975585938, "rew_std": 90.72039308816316, "Agent": "c51"}, {"env_step": 8800000, "rew": 885.2699951171875, "rew_std": 84.88027385527451, "Agent": "c51"}, {"env_step": 8900000, "rew": 940.8200012207031, "rew_std": 133.91121568644473, "Agent": "c51"}, {"env_step": 9000000, "rew": 858.2299926757812, "rew_std": 106.44362694927028, "Agent": "c51"}, {"env_step": 9100000, "rew": 843.5200012207031, "rew_std": 68.82380650364031, "Agent": "c51"}, {"env_step": 9200000, "rew": 847.75, "rew_std": 129.47580625363784, "Agent": "c51"}, {"env_step": 9300000, "rew": 898.089990234375, "rew_std": 74.57461814213535, "Agent": "c51"}, {"env_step": 9400000, "rew": 837.9999938964844, "rew_std": 75.13513732170806, "Agent": "c51"}, {"env_step": 9500000, "rew": 900.9, "rew_std": 78.32506786062443, "Agent": "c51"}, {"env_step": 9600000, "rew": 832.4200134277344, "rew_std": 69.69465721794408, "Agent": "c51"}, {"env_step": 9700000, "rew": 889.0700012207031, "rew_std": 126.08315874519296, "Agent": "c51"}, {"env_step": 9800000, "rew": 873.6100036621094, "rew_std": 72.68277945780702, "Agent": "c51"}, {"env_step": 9900000, "rew": 796.860009765625, "rew_std": 83.10054074269745, "Agent": "c51"}, {"env_step": 10000000, "rew": 821.8199951171875, "rew_std": 135.73986691667577, "Agent": "c51"}, {"env_step": 0, "rew": 0.010000000149011612, "rew_std": 0.03000000044703483, "Agent": "dqn"}, {"env_step": 100000, "rew": 0.28999999687075617, "rew_std": 0.6774215679654139, "Agent": "dqn"}, {"env_step": 200000, "rew": 0.44000001028180125, "rew_std": 0.8392854380207859, "Agent": "dqn"}, {"env_step": 300000, "rew": 0.3599999964237213, "rew_std": 0.8284925931025058, "Agent": "dqn"}, {"env_step": 400000, "rew": 0.33999999538064, "rew_std": 0.6873135967539007, "Agent": "dqn"}, {"env_step": 500000, "rew": 0.11000000089406967, "rew_std": 0.18138357257301754, "Agent": "dqn"}, {"env_step": 600000, "rew": 0.2100000001490116, "rew_std": 0.4548626165857307, "Agent": "dqn"}, {"env_step": 700000, "rew": 8.389999697357416, "rew_std": 23.108285476400564, "Agent": "dqn"}, {"env_step": 800000, "rew": 98.94999904632569, "rew_std": 35.660067729885725, "Agent": "dqn"}, {"env_step": 900000, "rew": 164.40999908447264, "rew_std": 59.0228520750357, "Agent": "dqn"}, {"env_step": 1000000, "rew": 210.4000030517578, "rew_std": 57.88502705780608, "Agent": "dqn"}, {"env_step": 1100000, "rew": 300.38000030517577, "rew_std": 82.23668084181749, "Agent": "dqn"}, {"env_step": 1200000, "rew": 302.7600036621094, "rew_std": 103.46174434569636, "Agent": "dqn"}, {"env_step": 1300000, "rew": 433.91000213623045, "rew_std": 126.5024948103054, "Agent": "dqn"}, {"env_step": 1400000, "rew": 416.14000244140624, "rew_std": 145.09603673682304, "Agent": "dqn"}, {"env_step": 1500000, "rew": 472.1600006103516, "rew_std": 86.80930065353702, "Agent": "dqn"}, {"env_step": 1600000, "rew": 536.65, "rew_std": 132.84745000480228, "Agent": "dqn"}, {"env_step": 1700000, "rew": 511.6300048828125, "rew_std": 113.56259400514695, "Agent": "dqn"}, {"env_step": 1800000, "rew": 559.5200012207031, "rew_std": 95.26979029881092, "Agent": "dqn"}, {"env_step": 1900000, "rew": 504.64000244140624, "rew_std": 183.2878214612098, "Agent": "dqn"}, {"env_step": 2000000, "rew": 574.7700103759765, "rew_std": 78.04244399982899, "Agent": "dqn"}, {"env_step": 2100000, "rew": 531.539998626709, "rew_std": 230.03735295552605, "Agent": "dqn"}, {"env_step": 2200000, "rew": 584.3100006103516, "rew_std": 116.97556069856971, "Agent": "dqn"}, {"env_step": 2300000, "rew": 609.7900024414063, "rew_std": 76.25380786006397, "Agent": "dqn"}, {"env_step": 2400000, "rew": 601.6499938964844, "rew_std": 156.2863846625289, "Agent": "dqn"}, {"env_step": 2500000, "rew": 614.8899978637695, "rew_std": 188.88530877823078, "Agent": "dqn"}, {"env_step": 2600000, "rew": 585.7100036621093, "rew_std": 183.29359497607433, "Agent": "dqn"}, {"env_step": 2700000, "rew": 681.8800048828125, "rew_std": 179.32764210720728, "Agent": "dqn"}, {"env_step": 2800000, "rew": 593.8799987792969, "rew_std": 178.6578949602182, "Agent": "dqn"}, {"env_step": 2900000, "rew": 685.2, "rew_std": 118.27089032922618, "Agent": "dqn"}, {"env_step": 3000000, "rew": 683.2299926757812, "rew_std": 131.34903655399373, "Agent": "dqn"}, {"env_step": 3100000, "rew": 662.1999938964843, "rew_std": 109.7032239820281, "Agent": "dqn"}, {"env_step": 3200000, "rew": 701.2099975585937, "rew_std": 88.04874320833147, "Agent": "dqn"}, {"env_step": 3300000, "rew": 688.9199981689453, "rew_std": 126.02541709175058, "Agent": "dqn"}, {"env_step": 3400000, "rew": 636.0799987792968, "rew_std": 172.2193654656943, "Agent": "dqn"}, {"env_step": 3500000, "rew": 653.7300018310547, "rew_std": 166.93894277813533, "Agent": "dqn"}, {"env_step": 3600000, "rew": 684.3899963378906, "rew_std": 172.87680391908185, "Agent": "dqn"}, {"env_step": 3700000, "rew": 643.3400039672852, "rew_std": 180.69860945189737, "Agent": "dqn"}, {"env_step": 3800000, "rew": 601.6399993896484, "rew_std": 220.07335285006258, "Agent": "dqn"}, {"env_step": 3900000, "rew": 787.8099914550781, "rew_std": 150.5371983171373, "Agent": "dqn"}, {"env_step": 4000000, "rew": 709.3800048828125, "rew_std": 144.69985159836313, "Agent": "dqn"}, {"env_step": 4100000, "rew": 764.1300018310546, "rew_std": 195.3602195608862, "Agent": "dqn"}, {"env_step": 4200000, "rew": 680.2700012207031, "rew_std": 210.1577440975007, "Agent": "dqn"}, {"env_step": 4300000, "rew": 705.5600036621094, "rew_std": 216.64282568222822, "Agent": "dqn"}, {"env_step": 4400000, "rew": 808.1700073242188, "rew_std": 171.82676781938977, "Agent": "dqn"}, {"env_step": 4500000, "rew": 715.6900006294251, "rew_std": 325.7469276625226, "Agent": "dqn"}, {"env_step": 4600000, "rew": 732.2800018310547, "rew_std": 201.57531656345432, "Agent": "dqn"}, {"env_step": 4700000, "rew": 786.0399963378907, "rew_std": 166.10157244455863, "Agent": "dqn"}, {"env_step": 4800000, "rew": 786.3699920654296, "rew_std": 178.73539138167627, "Agent": "dqn"}, {"env_step": 4900000, "rew": 775.7399993896485, "rew_std": 224.3126871078825, "Agent": "dqn"}, {"env_step": 5000000, "rew": 837.7899932861328, "rew_std": 153.09056362847045, "Agent": "dqn"}, {"env_step": 5100000, "rew": 830.0400085449219, "rew_std": 160.10900182067942, "Agent": "dqn"}, {"env_step": 5200000, "rew": 823.5699981689453, "rew_std": 194.98995547995364, "Agent": "dqn"}, {"env_step": 5300000, "rew": 855.3900024414063, "rew_std": 140.50763881053481, "Agent": "dqn"}, {"env_step": 5400000, "rew": 894.0799865722656, "rew_std": 140.23513752874317, "Agent": "dqn"}, {"env_step": 5500000, "rew": 833.1599899291992, "rew_std": 252.01737545461143, "Agent": "dqn"}, {"env_step": 5600000, "rew": 810.3499969482422, "rew_std": 203.2235554729935, "Agent": "dqn"}, {"env_step": 5700000, "rew": 725.3200134277344, "rew_std": 319.200193375417, "Agent": "dqn"}, {"env_step": 5800000, "rew": 766.3399963378906, "rew_std": 245.59766336856708, "Agent": "dqn"}, {"env_step": 5900000, "rew": 824.45, "rew_std": 157.8227175018482, "Agent": "dqn"}, {"env_step": 6000000, "rew": 839.1499938964844, "rew_std": 267.6931744720739, "Agent": "dqn"}, {"env_step": 6100000, "rew": 911.7200012207031, "rew_std": 149.13539534554963, "Agent": "dqn"}, {"env_step": 6200000, "rew": 865.1299987792969, "rew_std": 151.98633776803706, "Agent": "dqn"}, {"env_step": 6300000, "rew": 701.3800109863281, "rew_std": 231.76907968297863, "Agent": "dqn"}, {"env_step": 6400000, "rew": 848.5299987792969, "rew_std": 142.20331551456655, "Agent": "dqn"}, {"env_step": 6500000, "rew": 857.1699829101562, "rew_std": 245.273054002329, "Agent": "dqn"}, {"env_step": 6600000, "rew": 872.0099975585938, "rew_std": 275.1938175427823, "Agent": "dqn"}, {"env_step": 6700000, "rew": 780.0400024414063, "rew_std": 218.67946501129768, "Agent": "dqn"}, {"env_step": 6800000, "rew": 972.5299926757813, "rew_std": 84.68238747454869, "Agent": "dqn"}, {"env_step": 6900000, "rew": 839.6300048828125, "rew_std": 172.06233073457074, "Agent": "dqn"}, {"env_step": 7000000, "rew": 765.7000030517578, "rew_std": 228.73327046919016, "Agent": "dqn"}, {"env_step": 7100000, "rew": 803.6699981689453, "rew_std": 223.20593976154984, "Agent": "dqn"}, {"env_step": 7200000, "rew": 869.5399948120117, "rew_std": 296.05559318233026, "Agent": "dqn"}, {"env_step": 7300000, "rew": 899.0700073242188, "rew_std": 223.90129458785196, "Agent": "dqn"}, {"env_step": 7400000, "rew": 894.3500122070312, "rew_std": 124.86718242625085, "Agent": "dqn"}, {"env_step": 7500000, "rew": 844.4800048828125, "rew_std": 178.28963708114927, "Agent": "dqn"}, {"env_step": 7600000, "rew": 832.0400024414063, "rew_std": 169.4274077668312, "Agent": "dqn"}, {"env_step": 7700000, "rew": 792.3100036621094, "rew_std": 230.68153832883345, "Agent": "dqn"}, {"env_step": 7800000, "rew": 803.5799963474274, "rew_std": 309.8821414828576, "Agent": "dqn"}, {"env_step": 7900000, "rew": 673.1000030517578, "rew_std": 227.6657908497509, "Agent": "dqn"}, {"env_step": 8000000, "rew": 902.8799987792969, "rew_std": 131.25283923863736, "Agent": "dqn"}, {"env_step": 8100000, "rew": 724.4699996948242, "rew_std": 295.4643426314042, "Agent": "dqn"}, {"env_step": 8200000, "rew": 927.2100036621093, "rew_std": 143.6894016940865, "Agent": "dqn"}, {"env_step": 8300000, "rew": 942.3600006103516, "rew_std": 285.8560329981964, "Agent": "dqn"}, {"env_step": 8400000, "rew": 851.1799987792969, "rew_std": 200.8229014095921, "Agent": "dqn"}, {"env_step": 8500000, "rew": 901.9700012207031, "rew_std": 160.8610738450723, "Agent": "dqn"}, {"env_step": 8600000, "rew": 871.3400024414062, "rew_std": 190.1946167222594, "Agent": "dqn"}, {"env_step": 8700000, "rew": 833.9000122070313, "rew_std": 240.40292224599622, "Agent": "dqn"}, {"env_step": 8800000, "rew": 869.95, "rew_std": 184.55665785734556, "Agent": "dqn"}, {"env_step": 8900000, "rew": 875.4000030517578, "rew_std": 285.9085977204755, "Agent": "dqn"}, {"env_step": 9000000, "rew": 867.3599975585937, "rew_std": 361.56061577070335, "Agent": "dqn"}, {"env_step": 9100000, "rew": 856.3100036621094, "rew_std": 315.8472236982946, "Agent": "dqn"}, {"env_step": 9200000, "rew": 856.9499938964843, "rew_std": 170.14471559957494, "Agent": "dqn"}, {"env_step": 9300000, "rew": 888.9199951171875, "rew_std": 168.72139042881585, "Agent": "dqn"}, {"env_step": 9400000, "rew": 866.0400131225585, "rew_std": 299.502088920062, "Agent": "dqn"}, {"env_step": 9500000, "rew": 840.8400024414062, "rew_std": 331.5126113915152, "Agent": "dqn"}, {"env_step": 9600000, "rew": 807.6199981689454, "rew_std": 295.85304518327024, "Agent": "dqn"}, {"env_step": 9700000, "rew": 997.8700073242187, "rew_std": 180.62872163215707, "Agent": "dqn"}, {"env_step": 9800000, "rew": 902.3699951171875, "rew_std": 191.78846507427704, "Agent": "dqn"}, {"env_step": 9900000, "rew": 832.2099884033203, "rew_std": 279.22019714027266, "Agent": "dqn"}, {"env_step": 10000000, "rew": 833.1200012207031, "rew_std": 180.39020450524953, "Agent": "dqn"}, {"env_step": 0, "rew": 0.010000000149011612, "rew_std": 0.03000000044703483, "Agent": "fqf"}, {"env_step": 100000, "rew": 0.4000000074505806, "rew_std": 0.5949790043492437, "Agent": "fqf"}, {"env_step": 200000, "rew": 0.5199999868869781, "rew_std": 0.9031057265445962, "Agent": "fqf"}, {"env_step": 300000, "rew": 0.020000000298023225, "rew_std": 0.04000000059604644, "Agent": "fqf"}, {"env_step": 400000, "rew": 0.1600000001490116, "rew_std": 0.4476605856920158, "Agent": "fqf"}, {"env_step": 500000, "rew": 0.06999999880790711, "rew_std": 0.2099999964237213, "Agent": "fqf"}, {"env_step": 600000, "rew": 3.8100000239908693, "rew_std": 5.602936729313963, "Agent": "fqf"}, {"env_step": 700000, "rew": 12.430000038444996, "rew_std": 19.787372405641634, "Agent": "fqf"}, {"env_step": 800000, "rew": 85.2499984741211, "rew_std": 63.42670047163025, "Agent": "fqf"}, {"env_step": 900000, "rew": 133.19000046253205, "rew_std": 70.73937261722692, "Agent": "fqf"}, {"env_step": 1000000, "rew": 305.75999908447267, "rew_std": 103.32499176000272, "Agent": "fqf"}, {"env_step": 1100000, "rew": 413.0800033569336, "rew_std": 109.4271524578977, "Agent": "fqf"}, {"env_step": 1200000, "rew": 447.47999572753906, "rew_std": 130.462502495816, "Agent": "fqf"}, {"env_step": 1300000, "rew": 518.3400054931641, "rew_std": 135.58270493310644, "Agent": "fqf"}, {"env_step": 1400000, "rew": 657.4699951171875, "rew_std": 146.84401743315414, "Agent": "fqf"}, {"env_step": 1500000, "rew": 748.0899963378906, "rew_std": 115.51613589716597, "Agent": "fqf"}, {"env_step": 1600000, "rew": 675.2199920654297, "rew_std": 152.8333391660496, "Agent": "fqf"}, {"env_step": 1700000, "rew": 711.7800109863281, "rew_std": 140.070698003054, "Agent": "fqf"}, {"env_step": 1800000, "rew": 768.7699981689453, "rew_std": 205.88203217918607, "Agent": "fqf"}, {"env_step": 1900000, "rew": 830.1599975585938, "rew_std": 164.96536198083228, "Agent": "fqf"}, {"env_step": 2000000, "rew": 838.0, "rew_std": 134.02208935127933, "Agent": "fqf"}, {"env_step": 2100000, "rew": 860.7899963378907, "rew_std": 130.38507918675546, "Agent": "fqf"}, {"env_step": 2200000, "rew": 977.0700073242188, "rew_std": 126.20982209871863, "Agent": "fqf"}, {"env_step": 2300000, "rew": 950.0299987792969, "rew_std": 156.14618566531715, "Agent": "fqf"}, {"env_step": 2400000, "rew": 846.3499877929687, "rew_std": 248.7892251417476, "Agent": "fqf"}, {"env_step": 2500000, "rew": 992.1199951171875, "rew_std": 115.97767285528869, "Agent": "fqf"}, {"env_step": 2600000, "rew": 987.1100036621094, "rew_std": 102.14894278448398, "Agent": "fqf"}, {"env_step": 2700000, "rew": 1004.62001953125, "rew_std": 195.0578605917069, "Agent": "fqf"}, {"env_step": 2800000, "rew": 972.389990234375, "rew_std": 155.29393383794988, "Agent": "fqf"}, {"env_step": 2900000, "rew": 948.7399932861329, "rew_std": 274.68796913449233, "Agent": "fqf"}, {"env_step": 3000000, "rew": 1058.3299926757813, "rew_std": 170.51883401478082, "Agent": "fqf"}, {"env_step": 3100000, "rew": 1085.8400024414063, "rew_std": 143.12279720739653, "Agent": "fqf"}, {"env_step": 3200000, "rew": 1149.7299865722657, "rew_std": 218.88763506679157, "Agent": "fqf"}, {"env_step": 3300000, "rew": 1151.3599914550782, "rew_std": 190.10523364130052, "Agent": "fqf"}, {"env_step": 3400000, "rew": 1080.9000122070313, "rew_std": 332.21089689623733, "Agent": "fqf"}, {"env_step": 3500000, "rew": 1113.7200073242188, "rew_std": 122.5017752266977, "Agent": "fqf"}, {"env_step": 3600000, "rew": 1153.9199951171875, "rew_std": 110.683608376239, "Agent": "fqf"}, {"env_step": 3700000, "rew": 1151.8500061035156, "rew_std": 253.38377103265688, "Agent": "fqf"}, {"env_step": 3800000, "rew": 1277.9900146484374, "rew_std": 112.66564272737654, "Agent": "fqf"}, {"env_step": 3900000, "rew": 1282.3099731445313, "rew_std": 217.32348002992126, "Agent": "fqf"}, {"env_step": 4000000, "rew": 1248.0900024414063, "rew_std": 170.67968176451825, "Agent": "fqf"}, {"env_step": 4100000, "rew": 1322.8300170898438, "rew_std": 153.41429245269322, "Agent": "fqf"}, {"env_step": 4200000, "rew": 1236.4299896240234, "rew_std": 308.0954582465107, "Agent": "fqf"}, {"env_step": 4300000, "rew": 1342.439990234375, "rew_std": 193.51426337682267, "Agent": "fqf"}, {"env_step": 4400000, "rew": 1149.9899963378907, "rew_std": 244.50325562855912, "Agent": "fqf"}, {"env_step": 4500000, "rew": 1353.7800048828126, "rew_std": 228.50535375228858, "Agent": "fqf"}, {"env_step": 4600000, "rew": 1196.4300048828125, "rew_std": 221.77920221529982, "Agent": "fqf"}, {"env_step": 4700000, "rew": 1338.169989013672, "rew_std": 258.7844697757098, "Agent": "fqf"}, {"env_step": 4800000, "rew": 1455.7900146484376, "rew_std": 222.74215426809056, "Agent": "fqf"}, {"env_step": 4900000, "rew": 1465.7900024414062, "rew_std": 211.17771615384086, "Agent": "fqf"}, {"env_step": 5000000, "rew": 1360.9300048828125, "rew_std": 158.9558026017405, "Agent": "fqf"}, {"env_step": 5100000, "rew": 1326.210009765625, "rew_std": 153.008085562372, "Agent": "fqf"}, {"env_step": 5200000, "rew": 1324.9800048828124, "rew_std": 192.30021302076855, "Agent": "fqf"}, {"env_step": 5300000, "rew": 1373.3199951171875, "rew_std": 190.05878674516413, "Agent": "fqf"}, {"env_step": 5400000, "rew": 1444.8299926757813, "rew_std": 176.63967297772865, "Agent": "fqf"}, {"env_step": 5500000, "rew": 1380.8700012207032, "rew_std": 275.76877411799353, "Agent": "fqf"}, {"env_step": 5600000, "rew": 1449.3299926757813, "rew_std": 189.39536052457436, "Agent": "fqf"}, {"env_step": 5700000, "rew": 1399.7899780273438, "rew_std": 186.23228867562835, "Agent": "fqf"}, {"env_step": 5800000, "rew": 1526.0900024414063, "rew_std": 226.097034699169, "Agent": "fqf"}, {"env_step": 5900000, "rew": 1323.17001953125, "rew_std": 214.75273220122753, "Agent": "fqf"}, {"env_step": 6000000, "rew": 1335.5700073242188, "rew_std": 199.16455799287937, "Agent": "fqf"}, {"env_step": 6100000, "rew": 1455.260009765625, "rew_std": 188.3336061850183, "Agent": "fqf"}, {"env_step": 6200000, "rew": 1460.6299926757813, "rew_std": 168.61568012736888, "Agent": "fqf"}, {"env_step": 6300000, "rew": 1531.5299926757812, "rew_std": 223.6121634917823, "Agent": "fqf"}, {"env_step": 6400000, "rew": 1473.3, "rew_std": 157.68532141529403, "Agent": "fqf"}, {"env_step": 6500000, "rew": 1348.3100036621095, "rew_std": 336.5419653083397, "Agent": "fqf"}, {"env_step": 6600000, "rew": 1360.3900024414063, "rew_std": 385.11999323091857, "Agent": "fqf"}, {"env_step": 6700000, "rew": 1525.3900024414063, "rew_std": 223.73438160213453, "Agent": "fqf"}, {"env_step": 6800000, "rew": 1424.3700134277344, "rew_std": 227.2740165319224, "Agent": "fqf"}, {"env_step": 6900000, "rew": 1444.5199951171876, "rew_std": 206.8632128076105, "Agent": "fqf"}, {"env_step": 7000000, "rew": 1550.7000244140625, "rew_std": 243.50839787358856, "Agent": "fqf"}, {"env_step": 7100000, "rew": 1510.7899963378907, "rew_std": 258.7483723817995, "Agent": "fqf"}, {"env_step": 7200000, "rew": 1483.280010986328, "rew_std": 264.7287475532349, "Agent": "fqf"}, {"env_step": 7300000, "rew": 1499.6600219726563, "rew_std": 341.719842324931, "Agent": "fqf"}, {"env_step": 7400000, "rew": 1687.2500244140624, "rew_std": 256.1505463645012, "Agent": "fqf"}, {"env_step": 7500000, "rew": 1454.0300048828126, "rew_std": 280.16069877794627, "Agent": "fqf"}, {"env_step": 7600000, "rew": 1593.1700012207032, "rew_std": 356.6653348908056, "Agent": "fqf"}, {"env_step": 7700000, "rew": 1752.35, "rew_std": 272.67251651423953, "Agent": "fqf"}, {"env_step": 7800000, "rew": 1424.1700073242187, "rew_std": 240.21965983357364, "Agent": "fqf"}, {"env_step": 7900000, "rew": 1545.0499877929688, "rew_std": 274.2309684007817, "Agent": "fqf"}, {"env_step": 8000000, "rew": 1491.2900024414062, "rew_std": 221.5089150627939, "Agent": "fqf"}, {"env_step": 8100000, "rew": 1686.5300170898438, "rew_std": 233.44947282580907, "Agent": "fqf"}, {"env_step": 8200000, "rew": 1654.559991455078, "rew_std": 257.67832128859897, "Agent": "fqf"}, {"env_step": 8300000, "rew": 1608.6599975585937, "rew_std": 238.0655354689683, "Agent": "fqf"}, {"env_step": 8400000, "rew": 1575.3399780273437, "rew_std": 203.41885145877984, "Agent": "fqf"}, {"env_step": 8500000, "rew": 1501.899984741211, "rew_std": 443.3008682851743, "Agent": "fqf"}, {"env_step": 8600000, "rew": 1344.8300048828125, "rew_std": 226.3636211692771, "Agent": "fqf"}, {"env_step": 8700000, "rew": 1358.25, "rew_std": 207.60759860147468, "Agent": "fqf"}, {"env_step": 8800000, "rew": 1577.8999877929687, "rew_std": 218.78633687041156, "Agent": "fqf"}, {"env_step": 8900000, "rew": 1816.8199951171875, "rew_std": 314.3398063009122, "Agent": "fqf"}, {"env_step": 9000000, "rew": 1508.2200073242188, "rew_std": 202.8977505176873, "Agent": "fqf"}, {"env_step": 9100000, "rew": 1388.3, "rew_std": 358.01253786434296, "Agent": "fqf"}, {"env_step": 9200000, "rew": 1657.6999877929688, "rew_std": 162.50743736286006, "Agent": "fqf"}, {"env_step": 9300000, "rew": 1769.5699829101563, "rew_std": 430.9407204209698, "Agent": "fqf"}, {"env_step": 9400000, "rew": 1644.0599975585938, "rew_std": 363.31351881469755, "Agent": "fqf"}, {"env_step": 9500000, "rew": 1774.7999755859375, "rew_std": 458.10963716513834, "Agent": "fqf"}, {"env_step": 9600000, "rew": 1574.6399780273437, "rew_std": 286.1478292951951, "Agent": "fqf"}, {"env_step": 9700000, "rew": 1621.3900024414063, "rew_std": 203.88568091812692, "Agent": "fqf"}, {"env_step": 9800000, "rew": 1800.6699829101562, "rew_std": 246.23150505646822, "Agent": "fqf"}, {"env_step": 9900000, "rew": 1717.560009765625, "rew_std": 272.92596987574973, "Agent": "fqf"}, {"env_step": 10000000, "rew": 1663.030029296875, "rew_std": 215.58594858353038, "Agent": "fqf"}, {"env_step": 0, "rew": 0.2, "rew_std": 0.43817804165122526, "Agent": "qrdqn"}, {"env_step": 100000, "rew": 2.950000001490116, "rew_std": 8.683806768461812, "Agent": "qrdqn"}, {"env_step": 200000, "rew": 2.750000011920929, "rew_std": 7.12281545355883, "Agent": "qrdqn"}, {"env_step": 300000, "rew": 2.139999923855066, "rew_std": 6.060560801476709, "Agent": "qrdqn"}, {"env_step": 400000, "rew": 8.719999969005585, "rew_std": 12.750513633943633, "Agent": "qrdqn"}, {"env_step": 500000, "rew": 0.020000000298023225, "rew_std": 0.06000000089406966, "Agent": "qrdqn"}, {"env_step": 600000, "rew": 4.539999961853027, "rew_std": 8.518591324669725, "Agent": "qrdqn"}, {"env_step": 700000, "rew": 20.8, "rew_std": 19.17268910037082, "Agent": "qrdqn"}, {"env_step": 800000, "rew": 64.31000022888183, "rew_std": 55.11154952769602, "Agent": "qrdqn"}, {"env_step": 900000, "rew": 117.36000137329101, "rew_std": 81.42853758823472, "Agent": "qrdqn"}, {"env_step": 1000000, "rew": 212.5300022125244, "rew_std": 134.6447147733004, "Agent": "qrdqn"}, {"env_step": 1100000, "rew": 311.71999740600586, "rew_std": 143.0127312672216, "Agent": "qrdqn"}, {"env_step": 1200000, "rew": 427.21999702453616, "rew_std": 166.6607249218663, "Agent": "qrdqn"}, {"env_step": 1300000, "rew": 450.81999626159666, "rew_std": 170.6163965376507, "Agent": "qrdqn"}, {"env_step": 1400000, "rew": 446.6700017929077, "rew_std": 171.28357388934182, "Agent": "qrdqn"}, {"env_step": 1500000, "rew": 501.95000114440916, "rew_std": 214.17296736360868, "Agent": "qrdqn"}, {"env_step": 1600000, "rew": 515.3500011444091, "rew_std": 228.24397876121898, "Agent": "qrdqn"}, {"env_step": 1700000, "rew": 532.7900005340576, "rew_std": 260.70330697040697, "Agent": "qrdqn"}, {"env_step": 1800000, "rew": 535.5499984741211, "rew_std": 226.46023524425055, "Agent": "qrdqn"}, {"env_step": 1900000, "rew": 614.3999969482422, "rew_std": 229.86442537632706, "Agent": "qrdqn"}, {"env_step": 2000000, "rew": 495.1, "rew_std": 277.79406604885946, "Agent": "qrdqn"}, {"env_step": 2100000, "rew": 585.6600044250488, "rew_std": 230.43919543285637, "Agent": "qrdqn"}, {"env_step": 2200000, "rew": 716.0299999237061, "rew_std": 264.0099569711277, "Agent": "qrdqn"}, {"env_step": 2300000, "rew": 542.9899975776673, "rew_std": 303.6674555033, "Agent": "qrdqn"}, {"env_step": 2400000, "rew": 715.6400062561036, "rew_std": 286.50699130558786, "Agent": "qrdqn"}, {"env_step": 2500000, "rew": 648.0000051498413, "rew_std": 301.31887025376795, "Agent": "qrdqn"}, {"env_step": 2600000, "rew": 593.8800014495849, "rew_std": 302.4725858413253, "Agent": "qrdqn"}, {"env_step": 2700000, "rew": 662.1199962615967, "rew_std": 292.98960962786776, "Agent": "qrdqn"}, {"env_step": 2800000, "rew": 695.9800054550171, "rew_std": 284.20259753123815, "Agent": "qrdqn"}, {"env_step": 2900000, "rew": 729.7400060653687, "rew_std": 261.0564239167806, "Agent": "qrdqn"}, {"env_step": 3000000, "rew": 765.3200073242188, "rew_std": 267.8584904904683, "Agent": "qrdqn"}, {"env_step": 3100000, "rew": 763.0400096893311, "rew_std": 257.2424218386392, "Agent": "qrdqn"}, {"env_step": 3200000, "rew": 775.7299938201904, "rew_std": 273.62065502831194, "Agent": "qrdqn"}, {"env_step": 3300000, "rew": 768.5900030136108, "rew_std": 293.28401432770056, "Agent": "qrdqn"}, {"env_step": 3400000, "rew": 736.4700023651124, "rew_std": 251.00099161324306, "Agent": "qrdqn"}, {"env_step": 3500000, "rew": 704.0100011825562, "rew_std": 279.16315078624314, "Agent": "qrdqn"}, {"env_step": 3600000, "rew": 711.050004196167, "rew_std": 264.62492121177553, "Agent": "qrdqn"}, {"env_step": 3700000, "rew": 801.9700037002564, "rew_std": 277.7941106570264, "Agent": "qrdqn"}, {"env_step": 3800000, "rew": 844.069990158081, "rew_std": 287.56283848408725, "Agent": "qrdqn"}, {"env_step": 3900000, "rew": 759.6999963760376, "rew_std": 279.6283181481931, "Agent": "qrdqn"}, {"env_step": 4000000, "rew": 583.4499931335449, "rew_std": 287.06731842027597, "Agent": "qrdqn"}, {"env_step": 4100000, "rew": 749.8800132751464, "rew_std": 264.1112287832134, "Agent": "qrdqn"}, {"env_step": 4200000, "rew": 793.8099964141845, "rew_std": 302.25798478353556, "Agent": "qrdqn"}, {"env_step": 4300000, "rew": 721.4700023651124, "rew_std": 280.748223525854, "Agent": "qrdqn"}, {"env_step": 4400000, "rew": 782.9300025939941, "rew_std": 341.9947531259377, "Agent": "qrdqn"}, {"env_step": 4500000, "rew": 861.8200061798095, "rew_std": 300.90433581636256, "Agent": "qrdqn"}, {"env_step": 4600000, "rew": 699.4100095748902, "rew_std": 358.53734373918525, "Agent": "qrdqn"}, {"env_step": 4700000, "rew": 763.3199853897095, "rew_std": 321.5669115617899, "Agent": "qrdqn"}, {"env_step": 4800000, "rew": 875.8500049591064, "rew_std": 322.19139996909126, "Agent": "qrdqn"}, {"env_step": 4900000, "rew": 798.370009803772, "rew_std": 320.01471740842925, "Agent": "qrdqn"}, {"env_step": 5000000, "rew": 916.0799865722656, "rew_std": 321.69201590196326, "Agent": "qrdqn"}, {"env_step": 5100000, "rew": 854.7900035858154, "rew_std": 282.8008511766018, "Agent": "qrdqn"}, {"env_step": 5200000, "rew": 778.5300037384034, "rew_std": 300.45106950066236, "Agent": "qrdqn"}, {"env_step": 5300000, "rew": 824.4299976348877, "rew_std": 302.3329753994756, "Agent": "qrdqn"}, {"env_step": 5400000, "rew": 888.6600048065186, "rew_std": 338.1730635095935, "Agent": "qrdqn"}, {"env_step": 5500000, "rew": 839.840009689331, "rew_std": 347.04786183662765, "Agent": "qrdqn"}, {"env_step": 5600000, "rew": 743.8000047683715, "rew_std": 372.26147487134074, "Agent": "qrdqn"}, {"env_step": 5700000, "rew": 867.8499877929687, "rew_std": 316.0468936380672, "Agent": "qrdqn"}, {"env_step": 5800000, "rew": 823.3300037384033, "rew_std": 323.5871449731984, "Agent": "qrdqn"}, {"env_step": 5900000, "rew": 840.5399921417236, "rew_std": 379.45472835781385, "Agent": "qrdqn"}, {"env_step": 6000000, "rew": 795.1999963760376, "rew_std": 305.4413360252164, "Agent": "qrdqn"}, {"env_step": 6100000, "rew": 837.2100086212158, "rew_std": 294.2474416713455, "Agent": "qrdqn"}, {"env_step": 6200000, "rew": 832.8199975967407, "rew_std": 315.05369700324695, "Agent": "qrdqn"}, {"env_step": 6300000, "rew": 758.1000026702881, "rew_std": 356.9235426531571, "Agent": "qrdqn"}, {"env_step": 6400000, "rew": 869.2500061035156, "rew_std": 302.04547033603006, "Agent": "qrdqn"}, {"env_step": 6500000, "rew": 785.2299983978271, "rew_std": 393.64854338638054, "Agent": "qrdqn"}, {"env_step": 6600000, "rew": 790.1000085830689, "rew_std": 365.117793324928, "Agent": "qrdqn"}, {"env_step": 6700000, "rew": 871.6399927139282, "rew_std": 307.94262149553043, "Agent": "qrdqn"}, {"env_step": 6800000, "rew": 769.5600109100342, "rew_std": 397.7108398542242, "Agent": "qrdqn"}, {"env_step": 6900000, "rew": 897.1599975585938, "rew_std": 326.12778476504053, "Agent": "qrdqn"}, {"env_step": 7000000, "rew": 826.01999874115, "rew_std": 303.25010067918225, "Agent": "qrdqn"}, {"env_step": 7100000, "rew": 899.7099914550781, "rew_std": 354.635686696347, "Agent": "qrdqn"}, {"env_step": 7200000, "rew": 839.5300022125244, "rew_std": 366.1003253391808, "Agent": "qrdqn"}, {"env_step": 7300000, "rew": 789.2700035095215, "rew_std": 325.517405634325, "Agent": "qrdqn"}, {"env_step": 7400000, "rew": 791.4800006866456, "rew_std": 308.0200619677834, "Agent": "qrdqn"}, {"env_step": 7500000, "rew": 753.9000038146972, "rew_std": 353.6681404822802, "Agent": "qrdqn"}, {"env_step": 7600000, "rew": 760.5899974822999, "rew_std": 373.76654972757194, "Agent": "qrdqn"}, {"env_step": 7700000, "rew": 895.6800060272217, "rew_std": 332.0611307126876, "Agent": "qrdqn"}, {"env_step": 7800000, "rew": 797.7900001525879, "rew_std": 337.71737028991475, "Agent": "qrdqn"}, {"env_step": 7900000, "rew": 863.1199945449829, "rew_std": 383.8510796441181, "Agent": "qrdqn"}, {"env_step": 8000000, "rew": 936.8600036621094, "rew_std": 335.0957512819982, "Agent": "qrdqn"}, {"env_step": 8100000, "rew": 873.0900012969971, "rew_std": 323.48754155145383, "Agent": "qrdqn"}, {"env_step": 8200000, "rew": 897.2599962234497, "rew_std": 430.1072599184845, "Agent": "qrdqn"}, {"env_step": 8300000, "rew": 925.4600048065186, "rew_std": 328.0253425434283, "Agent": "qrdqn"}, {"env_step": 8400000, "rew": 800.1099956512451, "rew_std": 369.4526365613206, "Agent": "qrdqn"}, {"env_step": 8500000, "rew": 764.4199901580811, "rew_std": 386.03387542422104, "Agent": "qrdqn"}, {"env_step": 8600000, "rew": 951.6600109100342, "rew_std": 333.5321850552157, "Agent": "qrdqn"}, {"env_step": 8700000, "rew": 746.5100072860718, "rew_std": 286.61728504504305, "Agent": "qrdqn"}, {"env_step": 8800000, "rew": 849.2099956512451, "rew_std": 376.9793778487278, "Agent": "qrdqn"}, {"env_step": 8900000, "rew": 804.9700115203857, "rew_std": 377.45671631618694, "Agent": "qrdqn"}, {"env_step": 9000000, "rew": 855.3400024414062, "rew_std": 335.099863589258, "Agent": "qrdqn"}, {"env_step": 9100000, "rew": 660.5900043487549, "rew_std": 356.5631885015981, "Agent": "qrdqn"}, {"env_step": 9200000, "rew": 878.2999950408936, "rew_std": 312.5758680927236, "Agent": "qrdqn"}, {"env_step": 9300000, "rew": 826.950011062622, "rew_std": 350.83283915590056, "Agent": "qrdqn"}, {"env_step": 9400000, "rew": 790.7599872589111, "rew_std": 401.66813659775227, "Agent": "qrdqn"}, {"env_step": 9500000, "rew": 849.3099939346314, "rew_std": 313.7882372406271, "Agent": "qrdqn"}, {"env_step": 9600000, "rew": 854.3600103378296, "rew_std": 367.7412676045596, "Agent": "qrdqn"}, {"env_step": 9700000, "rew": 803.1500019073486, "rew_std": 384.89482159028836, "Agent": "qrdqn"}, {"env_step": 9800000, "rew": 655.2900049209595, "rew_std": 378.5388990350636, "Agent": "qrdqn"}, {"env_step": 9900000, "rew": 778.3899938583374, "rew_std": 332.5220751161268, "Agent": "qrdqn"}, {"env_step": 10000000, "rew": 805.2999959945679, "rew_std": 376.93931456836924, "Agent": "qrdqn"}, {"env_step": 0, "rew": 0.020000000298023225, "rew_std": 0.06000000089406966, "Agent": "iqn"}, {"env_step": 100000, "rew": 1.2300000190734863, "rew_std": 3.52648555976251, "Agent": "iqn"}, {"env_step": 200000, "rew": 0.17000000029802323, "rew_std": 0.2193171198611889, "Agent": "iqn"}, {"env_step": 300000, "rew": 2.0799999237060547, "rew_std": 5.910634254899296, "Agent": "iqn"}, {"env_step": 400000, "rew": 0.04000000059604645, "rew_std": 0.08000000119209288, "Agent": "iqn"}, {"env_step": 500000, "rew": 3.5900000773370264, "rew_std": 10.53740503238059, "Agent": "iqn"}, {"env_step": 600000, "rew": 4.530000066757202, "rew_std": 9.554166769060705, "Agent": "iqn"}, {"env_step": 700000, "rew": 3.480000114440918, "rew_std": 6.673799742209458, "Agent": "iqn"}, {"env_step": 800000, "rew": 37.689999313652514, "rew_std": 42.65694315548521, "Agent": "iqn"}, {"env_step": 900000, "rew": 123.90999913215637, "rew_std": 116.8702046746665, "Agent": "iqn"}, {"env_step": 1000000, "rew": 214.27999999523163, "rew_std": 131.19766379013453, "Agent": "iqn"}, {"env_step": 1100000, "rew": 314.01000213623047, "rew_std": 130.61631856241644, "Agent": "iqn"}, {"env_step": 1200000, "rew": 447.6299987792969, "rew_std": 132.88649299306232, "Agent": "iqn"}, {"env_step": 1300000, "rew": 488.24000244140626, "rew_std": 144.3410893300805, "Agent": "iqn"}, {"env_step": 1400000, "rew": 562.2800018310547, "rew_std": 126.35490427347918, "Agent": "iqn"}, {"env_step": 1500000, "rew": 503.0600067138672, "rew_std": 126.1369021393955, "Agent": "iqn"}, {"env_step": 1600000, "rew": 590.9699981689453, "rew_std": 106.22815802626981, "Agent": "iqn"}, {"env_step": 1700000, "rew": 656.8100067138672, "rew_std": 176.85540361563625, "Agent": "iqn"}, {"env_step": 1800000, "rew": 639.1500061035156, "rew_std": 159.90553612644817, "Agent": "iqn"}, {"env_step": 1900000, "rew": 654.3699951171875, "rew_std": 166.7387170420838, "Agent": "iqn"}, {"env_step": 2000000, "rew": 633.2700103759765, "rew_std": 194.57762929404822, "Agent": "iqn"}, {"env_step": 2100000, "rew": 700.1900115966797, "rew_std": 157.40320450762798, "Agent": "iqn"}, {"env_step": 2200000, "rew": 628.6800003051758, "rew_std": 207.51145605282667, "Agent": "iqn"}, {"env_step": 2300000, "rew": 684.490007019043, "rew_std": 224.21249061996116, "Agent": "iqn"}, {"env_step": 2400000, "rew": 756.5900001525879, "rew_std": 288.4319216808326, "Agent": "iqn"}, {"env_step": 2500000, "rew": 675.5500030517578, "rew_std": 244.21607763740568, "Agent": "iqn"}, {"env_step": 2600000, "rew": 779.7999938964844, "rew_std": 256.5563681757168, "Agent": "iqn"}, {"env_step": 2700000, "rew": 727.7399963378906, "rew_std": 269.84431788518737, "Agent": "iqn"}, {"env_step": 2800000, "rew": 792.0200012207031, "rew_std": 116.56821154467826, "Agent": "iqn"}, {"env_step": 2900000, "rew": 859.7300109863281, "rew_std": 185.18119041013455, "Agent": "iqn"}, {"env_step": 3000000, "rew": 899.7199981689453, "rew_std": 216.57974461966018, "Agent": "iqn"}, {"env_step": 3100000, "rew": 915.3699890136719, "rew_std": 114.51627047111124, "Agent": "iqn"}, {"env_step": 3200000, "rew": 795.7599945068359, "rew_std": 240.49648753795014, "Agent": "iqn"}, {"env_step": 3300000, "rew": 880.1699981689453, "rew_std": 189.51477550814192, "Agent": "iqn"}, {"env_step": 3400000, "rew": 945.1100036621094, "rew_std": 128.7564537028809, "Agent": "iqn"}, {"env_step": 3500000, "rew": 919.9100036621094, "rew_std": 244.82328680147785, "Agent": "iqn"}, {"env_step": 3600000, "rew": 982.8000061035157, "rew_std": 159.50998642265364, "Agent": "iqn"}, {"env_step": 3700000, "rew": 837.7000122070312, "rew_std": 188.50218141170882, "Agent": "iqn"}, {"env_step": 3800000, "rew": 1006.9300048828125, "rew_std": 142.2613367175323, "Agent": "iqn"}, {"env_step": 3900000, "rew": 913.0099868774414, "rew_std": 267.489982408041, "Agent": "iqn"}, {"env_step": 4000000, "rew": 874.3000061035157, "rew_std": 173.92007373390783, "Agent": "iqn"}, {"env_step": 4100000, "rew": 910.5500030517578, "rew_std": 194.92890230647552, "Agent": "iqn"}, {"env_step": 4200000, "rew": 983.5, "rew_std": 116.83092046232777, "Agent": "iqn"}, {"env_step": 4300000, "rew": 901.1400039672851, "rew_std": 305.8871257170003, "Agent": "iqn"}, {"env_step": 4400000, "rew": 813.9199890136719, "rew_std": 259.7093781051844, "Agent": "iqn"}, {"env_step": 4500000, "rew": 975.1299987792969, "rew_std": 249.7706832098956, "Agent": "iqn"}, {"env_step": 4600000, "rew": 964.7699890136719, "rew_std": 288.6829312458577, "Agent": "iqn"}, {"env_step": 4700000, "rew": 990.8800170898437, "rew_std": 227.1040665924821, "Agent": "iqn"}, {"env_step": 4800000, "rew": 1069.3499877929687, "rew_std": 184.13221489797237, "Agent": "iqn"}, {"env_step": 4900000, "rew": 985.4000122070313, "rew_std": 185.19558967958181, "Agent": "iqn"}, {"env_step": 5000000, "rew": 888.0499984741211, "rew_std": 383.0892119253023, "Agent": "iqn"}, {"env_step": 5100000, "rew": 1122.0600036621095, "rew_std": 252.77394487644332, "Agent": "iqn"}, {"env_step": 5200000, "rew": 972.6900054931641, "rew_std": 222.1775487183736, "Agent": "iqn"}, {"env_step": 5300000, "rew": 966.9400115966797, "rew_std": 369.08832261651287, "Agent": "iqn"}, {"env_step": 5400000, "rew": 789.2899993896484, "rew_std": 320.53568647830184, "Agent": "iqn"}, {"env_step": 5500000, "rew": 1027.3899841308594, "rew_std": 133.49564343614747, "Agent": "iqn"}, {"env_step": 5600000, "rew": 872.7399963378906, "rew_std": 283.1106543105209, "Agent": "iqn"}, {"env_step": 5700000, "rew": 1003.5799987792968, "rew_std": 303.12510600006334, "Agent": "iqn"}, {"env_step": 5800000, "rew": 898.3699935913086, "rew_std": 299.9163407129428, "Agent": "iqn"}, {"env_step": 5900000, "rew": 928.5400024414063, "rew_std": 183.30899650150636, "Agent": "iqn"}, {"env_step": 6000000, "rew": 1099.45, "rew_std": 215.64728660357196, "Agent": "iqn"}, {"env_step": 6100000, "rew": 1008.9999969482421, "rew_std": 270.1578310856458, "Agent": "iqn"}, {"env_step": 6200000, "rew": 1065.940008544922, "rew_std": 255.40183052553036, "Agent": "iqn"}, {"env_step": 6300000, "rew": 811.1000024795533, "rew_std": 373.20585603601734, "Agent": "iqn"}, {"env_step": 6400000, "rew": 940.3700012207031, "rew_std": 246.35399546539406, "Agent": "iqn"}, {"env_step": 6500000, "rew": 1068.6700012207032, "rew_std": 97.1969648010114, "Agent": "iqn"}, {"env_step": 6600000, "rew": 1245.320001220703, "rew_std": 287.68207875342046, "Agent": "iqn"}, {"env_step": 6700000, "rew": 1029.4099975585937, "rew_std": 181.585287367347, "Agent": "iqn"}, {"env_step": 6800000, "rew": 1042.259991455078, "rew_std": 164.0986750263718, "Agent": "iqn"}, {"env_step": 6900000, "rew": 838.8700035095214, "rew_std": 355.00632184818426, "Agent": "iqn"}, {"env_step": 7000000, "rew": 1098.1199951171875, "rew_std": 197.77309679595174, "Agent": "iqn"}, {"env_step": 7100000, "rew": 929.949984741211, "rew_std": 290.7787575853067, "Agent": "iqn"}, {"env_step": 7200000, "rew": 1002.5799926757812, "rew_std": 238.4512457320423, "Agent": "iqn"}, {"env_step": 7300000, "rew": 936.2500061035156, "rew_std": 200.61891005074025, "Agent": "iqn"}, {"env_step": 7400000, "rew": 1090.2499938964843, "rew_std": 137.09873398122215, "Agent": "iqn"}, {"env_step": 7500000, "rew": 1079.7300170898438, "rew_std": 129.4222508666326, "Agent": "iqn"}, {"env_step": 7600000, "rew": 968.8100051879883, "rew_std": 469.84580201774713, "Agent": "iqn"}, {"env_step": 7700000, "rew": 1022.8900024414063, "rew_std": 251.64726234338931, "Agent": "iqn"}, {"env_step": 7800000, "rew": 1021.4299987792969, "rew_std": 243.66798220474894, "Agent": "iqn"}, {"env_step": 7900000, "rew": 1113.2900024414062, "rew_std": 199.72603151675196, "Agent": "iqn"}, {"env_step": 8000000, "rew": 1132.0199890136719, "rew_std": 263.47352587686873, "Agent": "iqn"}, {"env_step": 8100000, "rew": 1050.8499877929687, "rew_std": 191.7771377236277, "Agent": "iqn"}, {"env_step": 8200000, "rew": 1099.139990234375, "rew_std": 223.08476706246242, "Agent": "iqn"}, {"env_step": 8300000, "rew": 1095.5199951171876, "rew_std": 152.96869354522246, "Agent": "iqn"}, {"env_step": 8400000, "rew": 1059.9700012207031, "rew_std": 121.60402177574996, "Agent": "iqn"}, {"env_step": 8500000, "rew": 1119.9500122070312, "rew_std": 173.45015933529174, "Agent": "iqn"}, {"env_step": 8600000, "rew": 940.7099975585937, "rew_std": 184.9244564548404, "Agent": "iqn"}, {"env_step": 8700000, "rew": 930.7999961853027, "rew_std": 366.8234875758687, "Agent": "iqn"}, {"env_step": 8800000, "rew": 1097.2800170898438, "rew_std": 296.206762846177, "Agent": "iqn"}, {"env_step": 8900000, "rew": 1139.8899780273437, "rew_std": 255.91239554199356, "Agent": "iqn"}, {"env_step": 9000000, "rew": 1043.5500061035157, "rew_std": 173.89118497858877, "Agent": "iqn"}, {"env_step": 9100000, "rew": 929.5200164794921, "rew_std": 373.30865054928415, "Agent": "iqn"}, {"env_step": 9200000, "rew": 1205.3200134277345, "rew_std": 275.42816935716706, "Agent": "iqn"}, {"env_step": 9300000, "rew": 1150.1200012207032, "rew_std": 260.06818848705825, "Agent": "iqn"}, {"env_step": 9400000, "rew": 1100.200018310547, "rew_std": 185.52076935234098, "Agent": "iqn"}, {"env_step": 9500000, "rew": 1058.1600158691406, "rew_std": 311.87799312292907, "Agent": "iqn"}, {"env_step": 9600000, "rew": 1252.6800048828125, "rew_std": 118.09878836211058, "Agent": "iqn"}, {"env_step": 9700000, "rew": 1132.0099853515626, "rew_std": 200.64719895414822, "Agent": "iqn"}, {"env_step": 9800000, "rew": 1039.539990234375, "rew_std": 270.93414588943654, "Agent": "iqn"}, {"env_step": 9900000, "rew": 1111.9599914550781, "rew_std": 303.33757722581527, "Agent": "iqn"}, {"env_step": 10000000, "rew": 1095.0599853515625, "rew_std": 200.86304116683058, "Agent": "iqn"}, {"env_step": 0, "rew": 0.2100000001490116, "rew_std": 0.5974110812223167, "Agent": "rainbow"}, {"env_step": 100000, "rew": 0.12999999523162842, "rew_std": 0.38999998569488525, "Agent": "rainbow"}, {"env_step": 200000, "rew": 2.7599999859929083, "rew_std": 6.376864428026797, "Agent": "rainbow"}, {"env_step": 300000, "rew": 0.7399999916553497, "rew_std": 1.967841428665537, "Agent": "rainbow"}, {"env_step": 400000, "rew": 0.7299999989569187, "rew_std": 1.9344508264320834, "Agent": "rainbow"}, {"env_step": 500000, "rew": 2.250000037252903, "rew_std": 6.453410065907903, "Agent": "rainbow"}, {"env_step": 600000, "rew": 0.3300000071525574, "rew_std": 0.7043436813838512, "Agent": "rainbow"}, {"env_step": 700000, "rew": 11.450000222027302, "rew_std": 19.350775633693363, "Agent": "rainbow"}, {"env_step": 800000, "rew": 51.87000031471253, "rew_std": 41.72313644425024, "Agent": "rainbow"}, {"env_step": 900000, "rew": 134.95999908447266, "rew_std": 26.553200308986938, "Agent": "rainbow"}, {"env_step": 1000000, "rew": 273.26000061035154, "rew_std": 40.46751980619983, "Agent": "rainbow"}, {"env_step": 1100000, "rew": 394.9699981689453, "rew_std": 35.29900920102157, "Agent": "rainbow"}, {"env_step": 1200000, "rew": 475.4699951171875, "rew_std": 51.0648386902766, "Agent": "rainbow"}, {"env_step": 1300000, "rew": 537.4499969482422, "rew_std": 87.05237149623139, "Agent": "rainbow"}, {"env_step": 1400000, "rew": 528.3800109863281, "rew_std": 74.70653568610189, "Agent": "rainbow"}, {"env_step": 1500000, "rew": 602.5700042724609, "rew_std": 63.9815013284615, "Agent": "rainbow"}, {"env_step": 1600000, "rew": 672.6400024414063, "rew_std": 75.62920855186832, "Agent": "rainbow"}, {"env_step": 1700000, "rew": 670.960009765625, "rew_std": 59.331076612532364, "Agent": "rainbow"}, {"env_step": 1800000, "rew": 704.7300048828125, "rew_std": 67.48957648360094, "Agent": "rainbow"}, {"env_step": 1900000, "rew": 787.0799987792968, "rew_std": 112.42707564022125, "Agent": "rainbow"}, {"env_step": 2000000, "rew": 823.6899963378906, "rew_std": 77.87041479137376, "Agent": "rainbow"}, {"env_step": 2100000, "rew": 840.9600036621093, "rew_std": 68.54743565383826, "Agent": "rainbow"}, {"env_step": 2200000, "rew": 822.8200012207031, "rew_std": 101.75918406873306, "Agent": "rainbow"}, {"env_step": 2300000, "rew": 846.6400024414063, "rew_std": 56.10774301137517, "Agent": "rainbow"}, {"env_step": 2400000, "rew": 935.4899963378906, "rew_std": 81.81529716155883, "Agent": "rainbow"}, {"env_step": 2500000, "rew": 871.6499938964844, "rew_std": 105.67288003470732, "Agent": "rainbow"}, {"env_step": 2600000, "rew": 935.3400085449218, "rew_std": 93.00937834754181, "Agent": "rainbow"}, {"env_step": 2700000, "rew": 962.9700134277343, "rew_std": 60.47081018959421, "Agent": "rainbow"}, {"env_step": 2800000, "rew": 939.1, "rew_std": 76.38223487303658, "Agent": "rainbow"}, {"env_step": 2900000, "rew": 983.4500122070312, "rew_std": 67.66671891975996, "Agent": "rainbow"}, {"env_step": 3000000, "rew": 1005.25, "rew_std": 46.68377918260524, "Agent": "rainbow"}, {"env_step": 3100000, "rew": 1027.85, "rew_std": 100.20803948410037, "Agent": "rainbow"}, {"env_step": 3200000, "rew": 1019.7700134277344, "rew_std": 74.38652294354544, "Agent": "rainbow"}, {"env_step": 3300000, "rew": 1025.939990234375, "rew_std": 67.48715328162088, "Agent": "rainbow"}, {"env_step": 3400000, "rew": 1048.9500061035155, "rew_std": 63.75370223721345, "Agent": "rainbow"}, {"env_step": 3500000, "rew": 1024.8799865722656, "rew_std": 81.16544192265837, "Agent": "rainbow"}, {"env_step": 3600000, "rew": 1057.9299865722655, "rew_std": 79.86718486180474, "Agent": "rainbow"}, {"env_step": 3700000, "rew": 1059.6200012207032, "rew_std": 100.3108670590954, "Agent": "rainbow"}, {"env_step": 3800000, "rew": 1100.7599975585938, "rew_std": 81.71528182411633, "Agent": "rainbow"}, {"env_step": 3900000, "rew": 1076.8199890136718, "rew_std": 65.37815728364572, "Agent": "rainbow"}, {"env_step": 4000000, "rew": 1191.0, "rew_std": 100.77746153732592, "Agent": "rainbow"}, {"env_step": 4100000, "rew": 1085.950018310547, "rew_std": 93.44744071480993, "Agent": "rainbow"}, {"env_step": 4200000, "rew": 1124.4300048828125, "rew_std": 98.69067996332086, "Agent": "rainbow"}, {"env_step": 4300000, "rew": 1204.660009765625, "rew_std": 81.11235149073514, "Agent": "rainbow"}, {"env_step": 4400000, "rew": 1136.6400024414063, "rew_std": 78.94447133335663, "Agent": "rainbow"}, {"env_step": 4500000, "rew": 1154.5200073242188, "rew_std": 74.92851522386881, "Agent": "rainbow"}, {"env_step": 4600000, "rew": 1206.0400085449219, "rew_std": 103.3929078135147, "Agent": "rainbow"}, {"env_step": 4700000, "rew": 1204.1800170898437, "rew_std": 82.69720477051608, "Agent": "rainbow"}, {"env_step": 4800000, "rew": 1142.9900146484374, "rew_std": 100.03756445774546, "Agent": "rainbow"}, {"env_step": 4900000, "rew": 1199.2599853515626, "rew_std": 43.66213881744983, "Agent": "rainbow"}, {"env_step": 5000000, "rew": 1174.4100036621094, "rew_std": 135.42985480511723, "Agent": "rainbow"}, {"env_step": 5100000, "rew": 1206.4500244140625, "rew_std": 65.40353311217433, "Agent": "rainbow"}, {"env_step": 5200000, "rew": 1213.0400024414062, "rew_std": 56.73084174140543, "Agent": "rainbow"}, {"env_step": 5300000, "rew": 1279.0799926757813, "rew_std": 122.6794261050074, "Agent": "rainbow"}, {"env_step": 5400000, "rew": 1260.5200073242188, "rew_std": 78.9505194850195, "Agent": "rainbow"}, {"env_step": 5500000, "rew": 1181.0700073242188, "rew_std": 114.83173344170228, "Agent": "rainbow"}, {"env_step": 5600000, "rew": 1176.05, "rew_std": 83.41206986065441, "Agent": "rainbow"}, {"env_step": 5700000, "rew": 1270.2599853515626, "rew_std": 124.96829424226486, "Agent": "rainbow"}, {"env_step": 5800000, "rew": 1261.5499755859375, "rew_std": 105.05167725943326, "Agent": "rainbow"}, {"env_step": 5900000, "rew": 1254.1099853515625, "rew_std": 103.52183258934855, "Agent": "rainbow"}, {"env_step": 6000000, "rew": 1285.210009765625, "rew_std": 135.08428673916382, "Agent": "rainbow"}, {"env_step": 6100000, "rew": 1321.8599975585937, "rew_std": 98.54867262115465, "Agent": "rainbow"}, {"env_step": 6200000, "rew": 1270.4499877929688, "rew_std": 134.84840828335157, "Agent": "rainbow"}, {"env_step": 6300000, "rew": 1291.8700073242187, "rew_std": 128.573159656795, "Agent": "rainbow"}, {"env_step": 6400000, "rew": 1372.1099975585937, "rew_std": 88.26145690808981, "Agent": "rainbow"}, {"env_step": 6500000, "rew": 1354.3300170898438, "rew_std": 76.23653593249794, "Agent": "rainbow"}, {"env_step": 6600000, "rew": 1337.8300048828125, "rew_std": 111.20302612183444, "Agent": "rainbow"}, {"env_step": 6700000, "rew": 1287.5800048828125, "rew_std": 156.0572077287139, "Agent": "rainbow"}, {"env_step": 6800000, "rew": 1319.3700073242187, "rew_std": 129.23841474784112, "Agent": "rainbow"}, {"env_step": 6900000, "rew": 1279.7999877929688, "rew_std": 117.75878546918071, "Agent": "rainbow"}, {"env_step": 7000000, "rew": 1328.610009765625, "rew_std": 100.9171629081728, "Agent": "rainbow"}, {"env_step": 7100000, "rew": 1364.7, "rew_std": 163.70892187079815, "Agent": "rainbow"}, {"env_step": 7200000, "rew": 1308.8900024414063, "rew_std": 88.94055366414823, "Agent": "rainbow"}, {"env_step": 7300000, "rew": 1322.25, "rew_std": 94.6752858690983, "Agent": "rainbow"}, {"env_step": 7400000, "rew": 1309.5300170898438, "rew_std": 130.62605278751548, "Agent": "rainbow"}, {"env_step": 7500000, "rew": 1346.460009765625, "rew_std": 117.62017984362635, "Agent": "rainbow"}, {"env_step": 7600000, "rew": 1307.6800170898437, "rew_std": 135.51715895844544, "Agent": "rainbow"}, {"env_step": 7700000, "rew": 1370.15, "rew_std": 121.40495533214569, "Agent": "rainbow"}, {"env_step": 7800000, "rew": 1366.02001953125, "rew_std": 155.8914434634503, "Agent": "rainbow"}, {"env_step": 7900000, "rew": 1383.0500122070312, "rew_std": 119.51592283983616, "Agent": "rainbow"}, {"env_step": 8000000, "rew": 1347.489990234375, "rew_std": 107.93389821410152, "Agent": "rainbow"}, {"env_step": 8100000, "rew": 1382.2799926757812, "rew_std": 81.35011185204777, "Agent": "rainbow"}, {"env_step": 8200000, "rew": 1357.7900024414062, "rew_std": 102.5295829744403, "Agent": "rainbow"}, {"env_step": 8300000, "rew": 1308.2999877929688, "rew_std": 108.36144846385606, "Agent": "rainbow"}, {"env_step": 8400000, "rew": 1368.2300048828124, "rew_std": 109.5325932250981, "Agent": "rainbow"}, {"env_step": 8500000, "rew": 1311.7599975585938, "rew_std": 113.36432112272027, "Agent": "rainbow"}, {"env_step": 8600000, "rew": 1384.7000122070312, "rew_std": 129.2364554734506, "Agent": "rainbow"}, {"env_step": 8700000, "rew": 1377.9300170898437, "rew_std": 130.36785628181076, "Agent": "rainbow"}, {"env_step": 8800000, "rew": 1420.160009765625, "rew_std": 126.74235879373302, "Agent": "rainbow"}, {"env_step": 8900000, "rew": 1345.9299926757812, "rew_std": 110.19251868290497, "Agent": "rainbow"}, {"env_step": 9000000, "rew": 1361.6299926757813, "rew_std": 146.04748540296958, "Agent": "rainbow"}, {"env_step": 9100000, "rew": 1334.089990234375, "rew_std": 85.54697028191892, "Agent": "rainbow"}, {"env_step": 9200000, "rew": 1292.2299926757812, "rew_std": 143.56093407787503, "Agent": "rainbow"}, {"env_step": 9300000, "rew": 1363.2300048828124, "rew_std": 162.6994478889228, "Agent": "rainbow"}, {"env_step": 9400000, "rew": 1438.1799926757812, "rew_std": 130.79961009153894, "Agent": "rainbow"}, {"env_step": 9500000, "rew": 1496.1199951171875, "rew_std": 112.32410367854669, "Agent": "rainbow"}, {"env_step": 9600000, "rew": 1472.02001953125, "rew_std": 126.8561263598282, "Agent": "rainbow"}, {"env_step": 9700000, "rew": 1391.2999877929688, "rew_std": 85.84510612212074, "Agent": "rainbow"}, {"env_step": 9800000, "rew": 1311.4199951171875, "rew_std": 129.5012392428379, "Agent": "rainbow"}, {"env_step": 9900000, "rew": 1416.0599975585938, "rew_std": 92.06283588597819, "Agent": "rainbow"}, {"env_step": 10000000, "rew": 1416.15, "rew_std": 73.5937659368437, "Agent": "rainbow"}, {"env_step": 0, "rew": 0.010000000149011612, "rew_std": 0.03000000044703483, "Agent": "ppo"}, {"env_step": 100000, "rew": 5.800000095367432, "rew_std": 9.745665904076512, "Agent": "ppo"}, {"env_step": 200000, "rew": 17.870000410079957, "rew_std": 24.34313324422257, "Agent": "ppo"}, {"env_step": 300000, "rew": 33.790000438690186, "rew_std": 34.83846926788018, "Agent": "ppo"}, {"env_step": 400000, "rew": 49.810000157356264, "rew_std": 45.02722450198439, "Agent": "ppo"}, {"env_step": 500000, "rew": 63.84000015258789, "rew_std": 55.360387449231766, "Agent": "ppo"}, {"env_step": 600000, "rew": 70.23000016212464, "rew_std": 58.73603829366222, "Agent": "ppo"}, {"env_step": 700000, "rew": 75.51999950408936, "rew_std": 67.29662320233204, "Agent": "ppo"}, {"env_step": 800000, "rew": 81.71000061035156, "rew_std": 56.81521740785272, "Agent": "ppo"}, {"env_step": 900000, "rew": 113.76000213623047, "rew_std": 79.55546964125922, "Agent": "ppo"}, {"env_step": 1000000, "rew": 116.16000061035156, "rew_std": 84.3558915187514, "Agent": "ppo"}, {"env_step": 1100000, "rew": 122.9199995458126, "rew_std": 82.33155847187241, "Agent": "ppo"}, {"env_step": 1200000, "rew": 150.4199990928173, "rew_std": 104.54179755010438, "Agent": "ppo"}, {"env_step": 1300000, "rew": 168.3199987411499, "rew_std": 108.28887045300536, "Agent": "ppo"}, {"env_step": 1400000, "rew": 176.67999801635742, "rew_std": 94.50735937346175, "Agent": "ppo"}, {"env_step": 1500000, "rew": 210.8900005340576, "rew_std": 108.90844271319088, "Agent": "ppo"}, {"env_step": 1600000, "rew": 211.0199996948242, "rew_std": 101.37994700391509, "Agent": "ppo"}, {"env_step": 1700000, "rew": 214.6699966430664, "rew_std": 100.4095196324463, "Agent": "ppo"}, {"env_step": 1800000, "rew": 247.6599998474121, "rew_std": 104.51677601247573, "Agent": "ppo"}, {"env_step": 1900000, "rew": 279.729997253418, "rew_std": 113.7720723989544, "Agent": "ppo"}, {"env_step": 2000000, "rew": 280.9099998474121, "rew_std": 106.76945620737145, "Agent": "ppo"}, {"env_step": 2100000, "rew": 288.3299987792969, "rew_std": 102.17095623218948, "Agent": "ppo"}, {"env_step": 2200000, "rew": 271.02000427246094, "rew_std": 118.16367469140917, "Agent": "ppo"}, {"env_step": 2300000, "rew": 269.90000305175784, "rew_std": 85.66159506214764, "Agent": "ppo"}, {"env_step": 2400000, "rew": 296.75999755859374, "rew_std": 95.57390780369239, "Agent": "ppo"}, {"env_step": 2500000, "rew": 300.6899978637695, "rew_std": 87.79065128890048, "Agent": "ppo"}, {"env_step": 2600000, "rew": 320.3000015258789, "rew_std": 91.139115860422, "Agent": "ppo"}, {"env_step": 2700000, "rew": 333.9300018310547, "rew_std": 89.31125875672396, "Agent": "ppo"}, {"env_step": 2800000, "rew": 327.020002746582, "rew_std": 120.26429493395794, "Agent": "ppo"}, {"env_step": 2900000, "rew": 361.1499954223633, "rew_std": 109.55767628353465, "Agent": "ppo"}, {"env_step": 3000000, "rew": 302.6900039672852, "rew_std": 98.16769631029796, "Agent": "ppo"}, {"env_step": 3100000, "rew": 315.95, "rew_std": 70.34762657993309, "Agent": "ppo"}, {"env_step": 3200000, "rew": 318.9499984741211, "rew_std": 115.132872934207, "Agent": "ppo"}, {"env_step": 3300000, "rew": 363.1899978637695, "rew_std": 85.86564602287181, "Agent": "ppo"}, {"env_step": 3400000, "rew": 368.1300018310547, "rew_std": 95.21212558703517, "Agent": "ppo"}, {"env_step": 3500000, "rew": 350.01000518798827, "rew_std": 93.16288451590842, "Agent": "ppo"}, {"env_step": 3600000, "rew": 388.5899993896484, "rew_std": 123.07756326920718, "Agent": "ppo"}, {"env_step": 3700000, "rew": 417.2999969482422, "rew_std": 100.34292919570994, "Agent": "ppo"}, {"env_step": 3800000, "rew": 461.9800048828125, "rew_std": 110.07789422926527, "Agent": "ppo"}, {"env_step": 3900000, "rew": 426.2000030517578, "rew_std": 88.50425199374192, "Agent": "ppo"}, {"env_step": 4000000, "rew": 449.4999969482422, "rew_std": 82.22106733939164, "Agent": "ppo"}, {"env_step": 4100000, "rew": 459.7000030517578, "rew_std": 107.17836845612624, "Agent": "ppo"}, {"env_step": 4200000, "rew": 465.42999572753905, "rew_std": 70.88704020848354, "Agent": "ppo"}, {"env_step": 4300000, "rew": 477.6600067138672, "rew_std": 132.27509463627436, "Agent": "ppo"}, {"env_step": 4400000, "rew": 410.0800048828125, "rew_std": 95.43147426617367, "Agent": "ppo"}, {"env_step": 4500000, "rew": 447.7100006103516, "rew_std": 70.30009378544847, "Agent": "ppo"}, {"env_step": 4600000, "rew": 462.73999786376953, "rew_std": 135.12483044104556, "Agent": "ppo"}, {"env_step": 4700000, "rew": 506.6499908447266, "rew_std": 102.90543516850502, "Agent": "ppo"}, {"env_step": 4800000, "rew": 504.0899993896484, "rew_std": 128.18980369342842, "Agent": "ppo"}, {"env_step": 4900000, "rew": 534.0000030517579, "rew_std": 116.97765592191337, "Agent": "ppo"}, {"env_step": 5000000, "rew": 513.1700057983398, "rew_std": 134.31567368090884, "Agent": "ppo"}, {"env_step": 5100000, "rew": 599.9900024414062, "rew_std": 114.45719219959994, "Agent": "ppo"}, {"env_step": 5200000, "rew": 602.4800048828125, "rew_std": 115.42681306636841, "Agent": "ppo"}, {"env_step": 5300000, "rew": 560.45, "rew_std": 147.17203595366996, "Agent": "ppo"}, {"env_step": 5400000, "rew": 542.2500030517579, "rew_std": 112.07122589244243, "Agent": "ppo"}, {"env_step": 5500000, "rew": 658.7099975585937, "rew_std": 119.60214061911367, "Agent": "ppo"}, {"env_step": 5600000, "rew": 624.2800048828125, "rew_std": 68.26668122502235, "Agent": "ppo"}, {"env_step": 5700000, "rew": 587.1499908447265, "rew_std": 79.0157166299757, "Agent": "ppo"}, {"env_step": 5800000, "rew": 649.9000061035156, "rew_std": 150.5787790102997, "Agent": "ppo"}, {"env_step": 5900000, "rew": 665.9100036621094, "rew_std": 119.23486176362321, "Agent": "ppo"}, {"env_step": 6000000, "rew": 706.7900024414063, "rew_std": 129.37492925213294, "Agent": "ppo"}, {"env_step": 6100000, "rew": 643.3500030517578, "rew_std": 116.35478540380245, "Agent": "ppo"}, {"env_step": 6200000, "rew": 721.2799926757813, "rew_std": 105.70935856689015, "Agent": "ppo"}, {"env_step": 6300000, "rew": 650.6100036621094, "rew_std": 148.55013326415474, "Agent": "ppo"}, {"env_step": 6400000, "rew": 768.1000030517578, "rew_std": 139.68046925775155, "Agent": "ppo"}, {"env_step": 6500000, "rew": 764.2999877929688, "rew_std": 118.32171828460929, "Agent": "ppo"}, {"env_step": 6600000, "rew": 782.5200073242188, "rew_std": 120.42663578622158, "Agent": "ppo"}, {"env_step": 6700000, "rew": 727.1499938964844, "rew_std": 130.45287574227336, "Agent": "ppo"}, {"env_step": 6800000, "rew": 783.6400024414063, "rew_std": 90.19995201850675, "Agent": "ppo"}, {"env_step": 6900000, "rew": 819.2, "rew_std": 132.53455239250277, "Agent": "ppo"}, {"env_step": 7000000, "rew": 794.2299987792969, "rew_std": 115.94847255070289, "Agent": "ppo"}, {"env_step": 7100000, "rew": 844.1199890136719, "rew_std": 122.43119457526758, "Agent": "ppo"}, {"env_step": 7200000, "rew": 889.6299987792969, "rew_std": 118.17887362331, "Agent": "ppo"}, {"env_step": 7300000, "rew": 861.8200012207031, "rew_std": 80.9622334545407, "Agent": "ppo"}, {"env_step": 7400000, "rew": 857.1600036621094, "rew_std": 95.34967659902838, "Agent": "ppo"}, {"env_step": 7500000, "rew": 892.6200073242187, "rew_std": 123.67628608131649, "Agent": "ppo"}, {"env_step": 7600000, "rew": 841.9999877929688, "rew_std": 86.62423578644787, "Agent": "ppo"}, {"env_step": 7700000, "rew": 890.85, "rew_std": 97.07490413687609, "Agent": "ppo"}, {"env_step": 7800000, "rew": 909.2900024414063, "rew_std": 86.85939542942558, "Agent": "ppo"}, {"env_step": 7900000, "rew": 906.0800048828125, "rew_std": 88.32103888799158, "Agent": "ppo"}, {"env_step": 8000000, "rew": 931.8700073242187, "rew_std": 80.47352350435204, "Agent": "ppo"}, {"env_step": 8100000, "rew": 938.1000061035156, "rew_std": 122.04440568291714, "Agent": "ppo"}, {"env_step": 8200000, "rew": 945.4200073242188, "rew_std": 66.3337244036705, "Agent": "ppo"}, {"env_step": 8300000, "rew": 971.860009765625, "rew_std": 91.97996093457455, "Agent": "ppo"}, {"env_step": 8400000, "rew": 1005.7700073242188, "rew_std": 129.41220377608226, "Agent": "ppo"}, {"env_step": 8500000, "rew": 972.6299926757813, "rew_std": 93.78562067872805, "Agent": "ppo"}, {"env_step": 8600000, "rew": 1000.3700012207031, "rew_std": 41.05399464776146, "Agent": "ppo"}, {"env_step": 8700000, "rew": 992.8999938964844, "rew_std": 132.0640325185449, "Agent": "ppo"}, {"env_step": 8800000, "rew": 1002.5400024414063, "rew_std": 93.22239772526292, "Agent": "ppo"}, {"env_step": 8900000, "rew": 979.8400085449218, "rew_std": 81.5561815195113, "Agent": "ppo"}, {"env_step": 9000000, "rew": 999.1100036621094, "rew_std": 134.88361081259976, "Agent": "ppo"}, {"env_step": 9100000, "rew": 1019.3699890136719, "rew_std": 110.85209895729604, "Agent": "ppo"}, {"env_step": 9200000, "rew": 1059.209979248047, "rew_std": 97.60941217671626, "Agent": "ppo"}, {"env_step": 9300000, "rew": 1088.9700012207031, "rew_std": 108.06601150231093, "Agent": "ppo"}, {"env_step": 9400000, "rew": 1053.210009765625, "rew_std": 92.88492116582314, "Agent": "ppo"}, {"env_step": 9500000, "rew": 1086.1199890136718, "rew_std": 105.10582835713497, "Agent": "ppo"}, {"env_step": 9600000, "rew": 1088.6500183105468, "rew_std": 111.11191848457115, "Agent": "ppo"}, {"env_step": 9700000, "rew": 1098.8700073242187, "rew_std": 110.51410372623518, "Agent": "ppo"}, {"env_step": 9800000, "rew": 1096.7400024414062, "rew_std": 105.4631692708768, "Agent": "ppo"}, {"env_step": 9900000, "rew": 1075.4200134277344, "rew_std": 89.31879559577925, "Agent": "ppo"}, {"env_step": 10000000, "rew": 1081.520001220703, "rew_std": 84.75678447189097, "Agent": "ppo"}]