[
    {
        "generation": 1,
        "timesteps": 500,
        "reward_mean": -38.969573510002185,
        "reward_max": -3.0626393210103044,
        "reward_min": -52.698529846225085,
        "leartime_s": 0.13352505100192502,
        "sampletime": 569.3318140329793,
        "best_mean": -38.969573510002185,
        "best_max": -3.0626393210103044,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 1000,
        "reward_mean": -36.00596452000123,
        "reward_max": -1.5361505081598816,
        "reward_min": -158.18413656446944,
        "leartime_s": 0.015990548999980092,
        "sampletime": 570.3570530370343,
        "best_mean": -36.00596452000123,
        "best_max": -1.5361505081598816,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 1500,
        "reward_mean": -18.021470680001038,
        "reward_max": -0.4931394318900337,
        "reward_min": -25.595242022139757,
        "leartime_s": 0.015438225003890693,
        "sampletime": 572.1265045939945,
        "best_mean": -18.021470680001038,
        "best_max": -0.4931394318900337,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 2000,
        "reward_mean": -18.23203529999985,
        "reward_max": -6.807233279289347,
        "reward_min": -86.07694092823607,
        "leartime_s": 0.01535351702477783,
        "sampletime": 576.3418417530484,
        "best_mean": -18.021470680001038,
        "best_max": -0.4931394318900337,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 2500,
        "reward_mean": -19.05257174000145,
        "reward_max": -5.868157011958701,
        "reward_min": -50.25943621089364,
        "leartime_s": 0.01544023200403899,
        "sampletime": 571.5733816460124,
        "best_mean": -18.021470680001038,
        "best_max": -0.4931394318900337,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 3000,
        "reward_mean": -17.238844899999695,
        "reward_max": -2.0195320438598072,
        "reward_min": -109.56873689543237,
        "leartime_s": 0.015448181016836315,
        "sampletime": 576.1490322870086,
        "best_mean": -17.238844899999695,
        "best_max": -2.0195320438598072,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 3500,
        "reward_mean": -9.88424845999993,
        "reward_max": -3.599876391200511,
        "reward_min": -64.66018317199676,
        "leartime_s": 0.018508541048504412,
        "sampletime": 578.2840277570067,
        "best_mean": -9.88424845999993,
        "best_max": -3.599876391200511,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 4000,
        "reward_mean": -6.795460489999343,
        "reward_max": -3.0535337295802334,
        "reward_min": -21.507966221722256,
        "leartime_s": 0.015319808037020266,
        "sampletime": 578.5873949499801,
        "best_mean": -6.795460489999343,
        "best_max": -3.0535337295802334,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 4500,
        "reward_mean": -4.0571886399998,
        "reward_max": -2.4542777730999896,
        "reward_min": -10.375665472850372,
        "leartime_s": 0.02034620800986886,
        "sampletime": 579.3548777420074,
        "best_mean": -4.0571886399998,
        "best_max": -2.4542777730999896,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 5000,
        "reward_mean": -2.530362249999992,
        "reward_max": -1.9793265353200136,
        "reward_min": -4.926777901429993,
        "leartime_s": 0.015210821002256125,
        "sampletime": 577.2748982319608,
        "best_mean": -2.530362249999992,
        "best_max": -1.9793265353200136,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 5500,
        "reward_mean": -2.2517815400000516,
        "reward_max": -1.9806720860001525,
        "reward_min": -2.651377428239794,
        "leartime_s": 0.015656024974305183,
        "sampletime": 582.4619523080182,
        "best_mean": -2.2517815400000516,
        "best_max": -1.9806720860001525,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 6000,
        "reward_mean": -2.1988227299999172,
        "reward_max": -2.0139540041199036,
        "reward_min": -2.544266098259982,
        "leartime_s": 0.015297741978429258,
        "sampletime": 578.4189607020235,
        "best_mean": -2.1988227299999172,
        "best_max": -2.0139540041199036,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 6500,
        "reward_mean": -2.0635411600000624,
        "reward_max": -1.9350540039901585,
        "reward_min": -2.303178705569923,
        "leartime_s": 0.01533948298310861,
        "sampletime": 576.0405339230201,
        "best_mean": -2.0635411600000624,
        "best_max": -1.9350540039901585,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 7000,
        "reward_mean": -1.8987125099998816,
        "reward_max": -1.7809098849998395,
        "reward_min": -2.2835176060899856,
        "leartime_s": 0.015477192995604128,
        "sampletime": 583.0306227809633,
        "best_mean": -1.8987125099998816,
        "best_max": -1.7809098849998395,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 7500,
        "reward_mean": -1.7555938200000822,
        "reward_max": -1.6640190994500021,
        "reward_min": -2.004013292950006,
        "leartime_s": 0.010900852968916297,
        "sampletime": 578.4146014400176,
        "best_mean": -1.7555938200000822,
        "best_max": -1.6640190994500021,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 8000,
        "reward_mean": -1.659880679999978,
        "reward_max": -1.5074923218400167,
        "reward_min": -1.8421954286200097,
        "leartime_s": 0.015861889987718314,
        "sampletime": 575.4658144790446,
        "best_mean": -1.659880679999978,
        "best_max": -1.5074923218400167,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 8500,
        "reward_mean": -1.5622210499999183,
        "reward_max": -1.4767481332199182,
        "reward_min": -1.7511194952098912,
        "leartime_s": 0.015406395017635077,
        "sampletime": 579.0646422600257,
        "best_mean": -1.5622210499999183,
        "best_max": -1.4767481332199182,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 9000,
        "reward_mean": -1.4354465599999429,
        "reward_max": -1.2660411910299199,
        "reward_min": -1.6188315162299858,
        "leartime_s": 0.01684004400158301,
        "sampletime": 578.7767601879896,
        "best_mean": -1.4354465599999429,
        "best_max": -1.2660411910299199,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 9500,
        "reward_mean": -1.280798009999978,
        "reward_max": -1.0832163080998878,
        "reward_min": -1.4204306605400359,
        "leartime_s": 0.015482005954254419,
        "sampletime": 578.7244094380294,
        "best_mean": -1.280798009999978,
        "best_max": -1.0832163080998878,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 10000,
        "reward_mean": -1.112414020000001,
        "reward_max": -0.9298404931399847,
        "reward_min": -1.2536328813900213,
        "leartime_s": 0.01562481396831572,
        "sampletime": 577.1743047339842,
        "best_mean": -1.112414020000001,
        "best_max": -0.9298404931399847,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 10500,
        "reward_mean": -0.9063415899999836,
        "reward_max": -0.7805896821899678,
        "reward_min": -1.0370808018799842,
        "leartime_s": 0.015680740005336702,
        "sampletime": 579.0684521019575,
        "best_mean": -0.9063415899999836,
        "best_max": -0.7805896821899678,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 11000,
        "reward_mean": -0.7728065200000588,
        "reward_max": -0.7091834837700581,
        "reward_min": -0.8833285467200276,
        "leartime_s": 0.016128354996908456,
        "sampletime": 577.3858530229772,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 11500,
        "reward_mean": -0.8023393299999607,
        "reward_max": -0.684423278249982,
        "reward_min": -0.9242597748000632,
        "leartime_s": 0.015048176981508732,
        "sampletime": 575.5236515970319,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 12000,
        "reward_mean": -0.8239096999999613,
        "reward_max": -0.6506487846299853,
        "reward_min": -0.9234173972999108,
        "leartime_s": 0.015970590990036726,
        "sampletime": 578.0936175550451,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 12500,
        "reward_mean": -0.8717786200000556,
        "reward_max": -0.6995515726801149,
        "reward_min": -0.979729980219979,
        "leartime_s": 0.024543028965126723,
        "sampletime": 576.5873234529863,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 13000,
        "reward_mean": -0.906463810000028,
        "reward_max": -0.7188481588300366,
        "reward_min": -1.0006854669900906,
        "leartime_s": 0.015939772012643516,
        "sampletime": 575.1587596859899,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 13500,
        "reward_mean": -0.9791180500001453,
        "reward_max": -0.80590419691006,
        "reward_min": -1.0811041509801682,
        "leartime_s": 0.016124108980875462,
        "sampletime": 578.4777256359812,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 14000,
        "reward_mean": -1.0189938499999975,
        "reward_max": -0.862090814010123,
        "reward_min": -1.128991761539977,
        "leartime_s": 0.01582660200074315,
        "sampletime": 575.2251577160205,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 14500,
        "reward_mean": -1.060063470000075,
        "reward_max": -0.9200836656299827,
        "reward_min": -1.1707854442101,
        "leartime_s": 0.016557891038246453,
        "sampletime": 573.8359876660397,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 15000,
        "reward_mean": -1.1047275699999481,
        "reward_max": -1.0124810589299549,
        "reward_min": -1.203279676209929,
        "leartime_s": 0.01600425405194983,
        "sampletime": 574.882917187002,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 15500,
        "reward_mean": -1.1460598599999192,
        "reward_max": -1.0575067579899713,
        "reward_min": -1.2498441531399098,
        "leartime_s": 0.016878699010703713,
        "sampletime": 575.9515746170073,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 16000,
        "reward_mean": -1.181419219999985,
        "reward_max": -1.1081756879400064,
        "reward_min": -1.2810006667899374,
        "leartime_s": 0.015850648982450366,
        "sampletime": 577.3284293379984,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 16500,
        "reward_mean": -1.2155162600000224,
        "reward_max": -1.122743865120024,
        "reward_min": -1.3274446370500226,
        "leartime_s": 0.01597649196628481,
        "sampletime": 578.5973263790365,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 17000,
        "reward_mean": -1.2453718100000335,
        "reward_max": -1.1373223000800325,
        "reward_min": -1.3374564613300377,
        "leartime_s": 0.01633579400368035,
        "sampletime": 570.3328798239818,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 17500,
        "reward_mean": -1.2422614700000532,
        "reward_max": -1.111239566620012,
        "reward_min": -1.329842333780091,
        "leartime_s": 0.01634980400558561,
        "sampletime": 576.9088695080136,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 18000,
        "reward_mean": -1.2250346600001303,
        "reward_max": -1.1069120777900996,
        "reward_min": -1.31797322101013,
        "leartime_s": 0.016307048965245485,
        "sampletime": 574.2664974220097,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 18500,
        "reward_mean": -1.1793172000001828,
        "reward_max": -1.0726386124001643,
        "reward_min": -1.2764956796701927,
        "leartime_s": 0.016407498042099178,
        "sampletime": 579.528542189044,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 19000,
        "reward_mean": -1.1898425399999788,
        "reward_max": -1.0863361950200041,
        "reward_min": -1.2910624293299646,
        "leartime_s": 0.016423901019152254,
        "sampletime": 572.8804558860138,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 19500,
        "reward_mean": -1.150309489999962,
        "reward_max": -1.0543066697699013,
        "reward_min": -1.2320367346600112,
        "leartime_s": 0.016135735029820353,
        "sampletime": 580.9815822630189,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 20000,
        "reward_mean": -1.1430150499998641,
        "reward_max": -1.0660412350699016,
        "reward_min": -1.233300667629845,
        "leartime_s": 0.0162965269992128,
        "sampletime": 575.6593226679834,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 20500,
        "reward_mean": -1.1777717100001512,
        "reward_max": -1.122523228470146,
        "reward_min": -1.2456773049901972,
        "leartime_s": 0.016619056987110525,
        "sampletime": 581.2026502980152,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 21000,
        "reward_mean": -1.2464459400000178,
        "reward_max": -1.1772664625299925,
        "reward_min": -1.3349711935400561,
        "leartime_s": 0.01674718497088179,
        "sampletime": 574.9594769859686,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 21500,
        "reward_mean": -1.317112050000051,
        "reward_max": -1.2268940432900346,
        "reward_min": -1.3895043435800611,
        "leartime_s": 0.016715829027816653,
        "sampletime": 576.506992397015,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 22000,
        "reward_mean": -1.3598762300000846,
        "reward_max": -1.2707829450600914,
        "reward_min": -1.4312802099800819,
        "leartime_s": 0.016444709966890514,
        "sampletime": 576.677252191992,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 22500,
        "reward_mean": -1.4005026700001084,
        "reward_max": -1.3064299614001145,
        "reward_min": -1.490116890070107,
        "leartime_s": 0.016943149967119098,
        "sampletime": 578.2712333320524,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 23000,
        "reward_mean": -1.4050126299998236,
        "reward_max": -1.3154308266198258,
        "reward_min": -1.4801403800398003,
        "leartime_s": 0.016404339985456318,
        "sampletime": 574.807321524946,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 23500,
        "reward_mean": -1.4116946400001138,
        "reward_max": -1.3401268889501157,
        "reward_min": -1.5048460376401085,
        "leartime_s": 0.02507382200565189,
        "sampletime": 576.4652032760205,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 24000,
        "reward_mean": -1.4114152600001708,
        "reward_max": -1.3375867817201654,
        "reward_min": -1.499059890070184,
        "leartime_s": 0.01646416197763756,
        "sampletime": 575.6232168040005,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 24500,
        "reward_mean": -1.3972900000001616,
        "reward_max": -1.0704837551700728,
        "reward_min": -1.4857777574101594,
        "leartime_s": 0.016519520024303347,
        "sampletime": 578.9487501589465,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 25000,
        "reward_mean": -1.3883985499998994,
        "reward_max": -1.0842147277099803,
        "reward_min": -1.4626241054499194,
        "leartime_s": 0.01634271099464968,
        "sampletime": 574.3453725280124,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 25500,
        "reward_mean": -1.3912732100000798,
        "reward_max": -1.3295005388200645,
        "reward_min": -1.461974942490079,
        "leartime_s": 0.01766339602181688,
        "sampletime": 577.6270200929721,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 26000,
        "reward_mean": -1.377564259999965,
        "reward_max": -1.3160341025599454,
        "reward_min": -1.4280653554899918,
        "leartime_s": 0.01669265399686992,
        "sampletime": 576.5472749050241,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 26500,
        "reward_mean": -1.3737464799999448,
        "reward_max": -1.2922787735499728,
        "reward_min": -1.4387921016899288,
        "leartime_s": 0.0172119089984335,
        "sampletime": 576.2457506339997,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 27000,
        "reward_mean": -1.3484265600001581,
        "reward_max": -1.2676125047901652,
        "reward_min": -1.4352554251901495,
        "leartime_s": 0.01733241102192551,
        "sampletime": 578.3178159850067,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 27500,
        "reward_mean": -1.306856659999839,
        "reward_max": -1.2303653531598704,
        "reward_min": -1.3654594786798109,
        "leartime_s": 0.016983508015982807,
        "sampletime": 574.869060940051,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 28000,
        "reward_mean": -1.271962920000127,
        "reward_max": -1.2134630553300985,
        "reward_min": -1.3452480845801602,
        "leartime_s": 0.017145039048045874,
        "sampletime": 580.644496613997,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 28500,
        "reward_mean": -1.2330831999999028,
        "reward_max": -1.1816731838499304,
        "reward_min": -1.29164336322989,
        "leartime_s": 0.017158861039206386,
        "sampletime": 573.8786813129555,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 29000,
        "reward_mean": -1.19843672000005,
        "reward_max": -1.1442397474200308,
        "reward_min": -1.2606483281900958,
        "leartime_s": 0.017268991970922798,
        "sampletime": 580.5459396170336,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 29500,
        "reward_mean": -1.2043012699999631,
        "reward_max": -1.1397771115199746,
        "reward_min": -1.2715559947499584,
        "leartime_s": 0.02008839201880619,
        "sampletime": 572.2734850250417,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 30000,
        "reward_mean": -1.2155689199999595,
        "reward_max": -1.1667483701899495,
        "reward_min": -1.2936250140699674,
        "leartime_s": 0.0258518640184775,
        "sampletime": 576.3252799619804,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 30500,
        "reward_mean": -1.2586682999998926,
        "reward_max": -1.185755746829922,
        "reward_min": -1.3522816039298622,
        "leartime_s": 0.01879865297814831,
        "sampletime": 574.785811534035,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 31000,
        "reward_mean": -1.2591933599999838,
        "reward_max": -1.201486128819955,
        "reward_min": -1.3212316407600273,
        "leartime_s": 0.017119110969360918,
        "sampletime": 577.5831626210129,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 31500,
        "reward_mean": -1.282278459999762,
        "reward_max": -1.217153552069766,
        "reward_min": -1.345305410769762,
        "leartime_s": 0.017494082974735647,
        "sampletime": 574.6926426650025,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 32000,
        "reward_mean": -1.3044666299999277,
        "reward_max": -1.2347346251299358,
        "reward_min": -1.3650031412399184,
        "leartime_s": 0.017509242985397577,
        "sampletime": 578.1330372710363,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 32500,
        "reward_mean": -1.3047923300000366,
        "reward_max": -1.243605412450038,
        "reward_min": -1.360869456730037,
        "leartime_s": 0.01752166502410546,
        "sampletime": 573.2219973119791,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 33000,
        "reward_mean": -1.316492919999802,
        "reward_max": -1.2602342131698105,
        "reward_min": -1.3760333162597977,
        "leartime_s": 0.017284608038607985,
        "sampletime": 578.9508436930482,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 33500,
        "reward_mean": -1.3107368300001454,
        "reward_max": -1.2615262058801298,
        "reward_min": -1.3688444618301632,
        "leartime_s": 0.017451262043323368,
        "sampletime": 576.5509438220179,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 34000,
        "reward_mean": -1.3189490400000723,
        "reward_max": -1.2328634518300663,
        "reward_min": -1.3726061979000779,
        "leartime_s": 0.017188260972034186,
        "sampletime": 577.5487088849768,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 34500,
        "reward_mean": -1.3245178199998753,
        "reward_max": -1.266751024879878,
        "reward_min": -1.3956965336298977,
        "leartime_s": 0.01739952602656558,
        "sampletime": 575.4116226100014,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 35000,
        "reward_mean": -1.3231244499998607,
        "reward_max": -1.257938098829873,
        "reward_min": -1.3816418705298514,
        "leartime_s": 0.026174529979471117,
        "sampletime": 578.8145474939956,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 35500,
        "reward_mean": -1.3119879600003235,
        "reward_max": -1.2426378255802788,
        "reward_min": -1.375483248100348,
        "leartime_s": 0.017368644010275602,
        "sampletime": 576.1358317830018,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 36000,
        "reward_mean": -1.290885040000147,
        "reward_max": -1.2169253740901858,
        "reward_min": -1.3571257285501162,
        "leartime_s": 0.017654132971074432,
        "sampletime": 576.0462309040013,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 36500,
        "reward_mean": -1.279595439999964,
        "reward_max": -1.2166888143999952,
        "reward_min": -1.3445285222799481,
        "leartime_s": 0.017387802014127374,
        "sampletime": 581.7105856279959,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 37000,
        "reward_mean": -1.2664788099997824,
        "reward_max": -1.202345611009758,
        "reward_min": -1.321126014739809,
        "leartime_s": 0.017546247981954366,
        "sampletime": 575.039348307997,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 37500,
        "reward_mean": -1.2615432600000045,
        "reward_max": -1.1757198848600559,
        "reward_min": -1.3255361025599601,
        "leartime_s": 0.028060341021046042,
        "sampletime": 579.1981604250032,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 38000,
        "reward_mean": -1.2524786099999774,
        "reward_max": -1.1673896346600243,
        "reward_min": -1.3004196273399444,
        "leartime_s": 0.035504096013028175,
        "sampletime": 576.5975175400381,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 38500,
        "reward_mean": -1.2380291500000766,
        "reward_max": -1.1875049448700534,
        "reward_min": -1.2899233076101075,
        "leartime_s": 0.01804789900779724,
        "sampletime": 575.8999252159847,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 39000,
        "reward_mean": -1.235875640000041,
        "reward_max": -1.178653743880041,
        "reward_min": -1.2984674855500482,
        "leartime_s": 0.017873332020826638,
        "sampletime": 574.8935890329885,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 39500,
        "reward_mean": -1.2290852399997216,
        "reward_max": -1.1738084733197214,
        "reward_min": -1.281733531469717,
        "leartime_s": 0.017637039010878652,
        "sampletime": 571.405817715975,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 40000,
        "reward_mean": -1.2317683200000984,
        "reward_max": -1.1737400084301164,
        "reward_min": -1.29399127329007,
        "leartime_s": 0.017803544003982097,
        "sampletime": 572.1427131420351,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 40500,
        "reward_mean": -1.2350247300000166,
        "reward_max": -1.1718965686900524,
        "reward_min": -1.2973175852199816,
        "leartime_s": 0.01904284203192219,
        "sampletime": 575.994149555976,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 41000,
        "reward_mean": -1.2378056899999823,
        "reward_max": -1.1563567754400075,
        "reward_min": -1.2938738822999427,
        "leartime_s": 0.01817374798702076,
        "sampletime": 575.2360095659969,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 41500,
        "reward_mean": -1.2358132799999035,
        "reward_max": -1.1693486066098686,
        "reward_min": -1.304924506569928,
        "leartime_s": 0.021485096018295735,
        "sampletime": 572.3678180009592,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 42000,
        "reward_mean": -1.2396093099997447,
        "reward_max": -1.1800174901597464,
        "reward_min": -1.298925885849748,
        "leartime_s": 0.017800014000386,
        "sampletime": 576.3292965810397,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 42500,
        "reward_mean": -1.233407060000151,
        "reward_max": -1.1691634146701455,
        "reward_min": -1.2874069819101561,
        "leartime_s": 0.018541826982982457,
        "sampletime": 571.5530495719868,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 43000,
        "reward_mean": -1.2325132499998626,
        "reward_max": -1.1865325801498825,
        "reward_min": -1.2907249545398365,
        "leartime_s": 0.02229966997401789,
        "sampletime": 576.0879431780195,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 43500,
        "reward_mean": -1.2272889099997928,
        "reward_max": -1.1774302515698327,
        "reward_min": -1.2746241520697712,
        "leartime_s": 0.022790032031480223,
        "sampletime": 574.7180906109861,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 44000,
        "reward_mean": -1.2301710199999012,
        "reward_max": -1.1320766535499045,
        "reward_min": -1.2740522170598978,
        "leartime_s": 0.022925341967493296,
        "sampletime": 576.100211240002,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 44500,
        "reward_mean": -1.231622019999988,
        "reward_max": -1.183627275480007,
        "reward_min": -1.2912169484699578,
        "leartime_s": 0.021239856025204062,
        "sampletime": 576.7341905159992,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 45000,
        "reward_mean": -1.2386742999999183,
        "reward_max": -1.0763338260099387,
        "reward_min": -1.2935459901599107,
        "leartime_s": 0.01928971498273313,
        "sampletime": 577.6770152180106,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 45500,
        "reward_mean": -1.2379817199998966,
        "reward_max": -1.1783920434398927,
        "reward_min": -1.2968601315098967,
        "leartime_s": 0.018466816982254386,
        "sampletime": 576.0224600019865,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 46000,
        "reward_mean": -1.243397049999945,
        "reward_max": -1.1814886292199505,
        "reward_min": -1.3145752210699388,
        "leartime_s": 0.018227721971925348,
        "sampletime": 577.4651565990061,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 46500,
        "reward_mean": -1.244936120000166,
        "reward_max": -1.1835050506601335,
        "reward_min": -1.2962669536201912,
        "leartime_s": 0.018032132007647306,
        "sampletime": 574.524297520984,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 47000,
        "reward_mean": -1.2432278499998841,
        "reward_max": -1.1949243114498809,
        "reward_min": -1.2941669453498925,
        "leartime_s": 0.018672387988772243,
        "sampletime": 576.8336314369808,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 47500,
        "reward_mean": -1.2402691900000513,
        "reward_max": -1.1800616530300483,
        "reward_min": -1.3016869001000568,
        "leartime_s": 0.018630284001119435,
        "sampletime": 575.233219144051,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 48000,
        "reward_mean": -1.2403823100000981,
        "reward_max": -1.1890026812201282,
        "reward_min": -1.291550604120085,
        "leartime_s": 0.018615870969370008,
        "sampletime": 579.5473994080094,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 48500,
        "reward_mean": -1.2322607499998508,
        "reward_max": -1.16812230066985,
        "reward_min": -1.2777048914598577,
        "leartime_s": 0.018681183049920946,
        "sampletime": 572.0527511830442,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 49000,
        "reward_mean": -1.2279260499999187,
        "reward_max": -1.1561392124799343,
        "reward_min": -1.3103638952699044,
        "leartime_s": 0.018148672999814153,
        "sampletime": 574.9719248149777,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 49500,
        "reward_mean": -1.2327187500000574,
        "reward_max": -1.181725958410025,
        "reward_min": -1.2868874570000848,
        "leartime_s": 0.018329024023842067,
        "sampletime": 577.7492186169839,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 50000,
        "reward_mean": -1.216387739999842,
        "reward_max": -1.1555296207098658,
        "reward_min": -1.2793339622898072,
        "leartime_s": 0.01891111198347062,
        "sampletime": 572.5657221869915,
        "best_mean": -0.7728065200000588,
        "best_max": -0.7091834837700581,
        "params": {
            "agentsize": 1000000,
            "yellow": 0,
            "seeds": 126291,
            "it": 100,
            "envs": 10,
            "population": 1000,
            "sampling": 16,
            "method": "oes"
        }
    }
]