[
    {
        "generation": 1,
        "timesteps": 200,
        "reward_mean": -39.09397500000001,
        "reward_max": -6.5902562499999995,
        "reward_min": -75.95585625,
        "leartime_s": 0.013545885012717918,
        "sampletime": 0.643831033987226,
        "best_mean": -39.09397500000001,
        "best_max": -6.5902562499999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 400,
        "reward_mean": -34.46722499999999,
        "reward_max": -1.6909124999999992,
        "reward_min": -228.5589125,
        "leartime_s": 0.033519440999953076,
        "sampletime": 0.7504375080170576,
        "best_mean": -34.46722499999999,
        "best_max": -1.6909124999999992,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 600,
        "reward_mean": -18.11649999999999,
        "reward_max": 1.9054625000000005,
        "reward_min": -38.716999999999985,
        "leartime_s": 0.014883273979648948,
        "sampletime": 0.9136985490040388,
        "best_mean": -18.11649999999999,
        "best_max": 1.9054625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 800,
        "reward_mean": -18.085475,
        "reward_max": -1.210225000000001,
        "reward_min": -35.58559375,
        "leartime_s": 0.026903769990894943,
        "sampletime": 0.7138109829975292,
        "best_mean": -18.085475,
        "best_max": -1.210225000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 1000,
        "reward_mean": -18.081175,
        "reward_max": 1.9188250000000011,
        "reward_min": -38.70617500000002,
        "leartime_s": 0.006792480009607971,
        "sampletime": 0.7889397199905943,
        "best_mean": -18.081175,
        "best_max": 1.9188250000000011,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 1200,
        "reward_mean": -18.08150000000001,
        "reward_max": 1.9185000000000014,
        "reward_min": -35.58150000000001,
        "leartime_s": 0.030600933998357505,
        "sampletime": 0.7353992870193906,
        "best_mean": -18.081175,
        "best_max": 1.9188250000000011,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 1400,
        "reward_mean": -18.082200000000004,
        "reward_max": -1.2072000000000016,
        "reward_min": -35.5822,
        "leartime_s": 0.008219709998229519,
        "sampletime": 0.8415609530056827,
        "best_mean": -18.081175,
        "best_max": 1.9188250000000011,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 1600,
        "reward_mean": -18.080900000000007,
        "reward_max": -1.2059000000000013,
        "reward_min": -38.70590000000002,
        "leartime_s": 0.013081154000246897,
        "sampletime": 0.7981904570187908,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 1800,
        "reward_mean": -18.08240000000001,
        "reward_max": -1.2074000000000016,
        "reward_min": -38.707399999999986,
        "leartime_s": 0.019480623013805598,
        "sampletime": 0.6717867880070116,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 2000,
        "reward_mean": -18.082300000000004,
        "reward_max": -1.2073000000000012,
        "reward_min": -44.957300000000004,
        "leartime_s": 0.0213290510000661,
        "sampletime": 0.742573324998375,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 2200,
        "reward_mean": -18.0818,
        "reward_max": -1.2067999999999999,
        "reward_min": -35.581800000000015,
        "leartime_s": 0.02064580499427393,
        "sampletime": 1.0112941570114344,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 2400,
        "reward_mean": -18.081100000000006,
        "reward_max": -4.331100000000001,
        "reward_min": -38.7061,
        "leartime_s": 0.007142990012653172,
        "sampletime": 0.8870325000025332,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 2600,
        "reward_mean": -18.083600000000004,
        "reward_max": -4.333600000000002,
        "reward_min": -38.708600000000004,
        "leartime_s": 0.037090931000420824,
        "sampletime": 0.8040875189763028,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 2800,
        "reward_mean": -18.082200000000004,
        "reward_max": -4.332200000000004,
        "reward_min": -35.582200000000036,
        "leartime_s": 0.04544151801383123,
        "sampletime": 1.0259977669920772,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 3000,
        "reward_mean": -18.082000000000008,
        "reward_max": -1.207262500000002,
        "reward_min": -41.83221249999997,
        "leartime_s": 0.04318494501058012,
        "sampletime": 0.9026020119781606,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 3200,
        "reward_mean": -18.082850000000004,
        "reward_max": -1.207862500000001,
        "reward_min": -41.83283750000001,
        "leartime_s": 0.036878359998809174,
        "sampletime": 0.8243566110031679,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 3400,
        "reward_mean": -18.082150000000006,
        "reward_max": 1.9177625000000011,
        "reward_min": -35.5822,
        "leartime_s": 0.02502431400353089,
        "sampletime": 1.1202949559956323,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 3600,
        "reward_mean": -18.08195000000001,
        "reward_max": -1.207200000000002,
        "reward_min": -38.7072,
        "leartime_s": 0.038682593003613874,
        "sampletime": 0.7629877610015683,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 3800,
        "reward_mean": -18.082,
        "reward_max": -1.207,
        "reward_min": -44.956999999999994,
        "leartime_s": 0.030836327001452446,
        "sampletime": 0.7874272739863954,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 4000,
        "reward_mean": -18.081700000000005,
        "reward_max": -1.2069375000000002,
        "reward_min": -38.7069875,
        "leartime_s": 0.009516802994767204,
        "sampletime": 0.93850588001078,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 4200,
        "reward_mean": -18.082275000000006,
        "reward_max": -4.332512499999992,
        "reward_min": -41.832525,
        "leartime_s": 0.01018225698499009,
        "sampletime": 1.1822802029782906,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 4400,
        "reward_mean": -18.08150000000001,
        "reward_max": -1.2069500000000004,
        "reward_min": -35.581975,
        "leartime_s": 0.03965358700952493,
        "sampletime": 0.8011488849879242,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 4600,
        "reward_mean": -18.08165000000001,
        "reward_max": -1.2078625000000007,
        "reward_min": -38.707887500000005,
        "leartime_s": 0.033773732982808724,
        "sampletime": 0.7822861500026193,
        "best_mean": -18.080900000000007,
        "best_max": -1.2059000000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 4800,
        "reward_mean": -18.08060000000001,
        "reward_max": -1.2058625000000005,
        "reward_min": -35.58085000000001,
        "leartime_s": 0.014820656972005963,
        "sampletime": 0.7121857409947552,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 5000,
        "reward_mean": -18.083225000000006,
        "reward_max": -1.2081562500000005,
        "reward_min": -38.7082,
        "leartime_s": 0.006694827025057748,
        "sampletime": 0.794350933021633,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 5200,
        "reward_mean": -18.082975000000005,
        "reward_max": 1.9171187500000013,
        "reward_min": -41.8330125,
        "leartime_s": 0.007045892009045929,
        "sampletime": 0.9087081569887232,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 5400,
        "reward_mean": -18.081800000000012,
        "reward_max": -1.2072750000000014,
        "reward_min": -35.582300000000025,
        "leartime_s": 0.019608230999438092,
        "sampletime": 1.0229406020080205,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 5600,
        "reward_mean": -18.081900000000008,
        "reward_max": -1.2068999999999996,
        "reward_min": -35.581900000000005,
        "leartime_s": 0.0516886469849851,
        "sampletime": 0.8421642720059026,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 5800,
        "reward_mean": -18.08105000000001,
        "reward_max": -1.2060374999999997,
        "reward_min": -35.58105,
        "leartime_s": 0.03488552902126685,
        "sampletime": 0.8236997759959195,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 6000,
        "reward_mean": -18.08215000000001,
        "reward_max": -1.2074000000000011,
        "reward_min": -35.5824,
        "leartime_s": 0.036798832996282727,
        "sampletime": 0.9541348140046466,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 6200,
        "reward_mean": -18.080900000000007,
        "reward_max": -1.2059000000000015,
        "reward_min": -38.70590000000003,
        "leartime_s": 0.02968296001199633,
        "sampletime": 0.724537603004137,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 6400,
        "reward_mean": -18.08090000000001,
        "reward_max": -1.2059000000000013,
        "reward_min": -35.58090000000002,
        "leartime_s": 0.02895358600653708,
        "sampletime": 0.8478896679880563,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 6600,
        "reward_mean": -18.081900000000008,
        "reward_max": -1.2071249999999996,
        "reward_min": -38.7072,
        "leartime_s": 0.046376696991501376,
        "sampletime": 0.9069543700024951,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 6800,
        "reward_mean": -18.08130000000001,
        "reward_max": -1.2065250000000007,
        "reward_min": -38.706537499999996,
        "leartime_s": 0.04724170800182037,
        "sampletime": 1.0998048309993464,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 7000,
        "reward_mean": -18.082600000000006,
        "reward_max": -1.2076000000000011,
        "reward_min": -38.70760000000001,
        "leartime_s": 0.0752205699973274,
        "sampletime": 0.9055327879905235,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 7200,
        "reward_mean": -18.08205000000001,
        "reward_max": 1.917637500000001,
        "reward_min": -35.58231250000001,
        "leartime_s": 0.020803679013624787,
        "sampletime": 0.8079174260201398,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 7400,
        "reward_mean": -18.083000000000006,
        "reward_max": -1.2082500000000005,
        "reward_min": -38.64576250000002,
        "leartime_s": 0.01538606098620221,
        "sampletime": 1.0042427250009496,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 7600,
        "reward_mean": -18.08240000000001,
        "reward_max": -1.2074000000000011,
        "reward_min": -38.707400000000014,
        "leartime_s": 0.03391506397747435,
        "sampletime": 0.8617186089977622,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 7800,
        "reward_mean": -18.082050000000006,
        "reward_max": 1.9179125000000008,
        "reward_min": -35.58207500000001,
        "leartime_s": 0.019798524997895584,
        "sampletime": 0.8137543460179586,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 8000,
        "reward_mean": -18.082650000000008,
        "reward_max": 1.917387500000001,
        "reward_min": -38.707687500000006,
        "leartime_s": 0.021533093007747084,
        "sampletime": 0.8621420859999489,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 8200,
        "reward_mean": -18.080700000000004,
        "reward_max": -4.331687500000005,
        "reward_min": -47.2067,
        "leartime_s": 0.021946874010609463,
        "sampletime": 1.1064555119955912,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 8400,
        "reward_mean": -18.082250000000002,
        "reward_max": -1.2075750000000014,
        "reward_min": -41.83246875000001,
        "leartime_s": 0.008903551992261782,
        "sampletime": 0.9744665359903593,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 8600,
        "reward_mean": -18.081025000000004,
        "reward_max": -4.333268750000002,
        "reward_min": -38.7082875,
        "leartime_s": 0.04615735498373397,
        "sampletime": 0.7698055589862633,
        "best_mean": -18.08060000000001,
        "best_max": -1.2058625000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 8800,
        "reward_mean": -18.079850000000008,
        "reward_max": 1.9170000000000014,
        "reward_min": -44.95808749999998,
        "leartime_s": 0.021610715019050986,
        "sampletime": 0.8303490780235734,
        "best_mean": -18.079850000000008,
        "best_max": 1.9170000000000014,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 9000,
        "reward_mean": -18.073400000000007,
        "reward_max": -1.201875000000001,
        "reward_min": -41.82986249999999,
        "leartime_s": 0.06049527900177054,
        "sampletime": 1.0698267499974463,
        "best_mean": -18.073400000000007,
        "best_max": -1.201875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 9200,
        "reward_mean": -18.077625,
        "reward_max": -1.2081750000000007,
        "reward_min": -38.70844375000001,
        "leartime_s": 0.036500508984318,
        "sampletime": 0.8119867570057977,
        "best_mean": -18.073400000000007,
        "best_max": -1.201875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 9400,
        "reward_mean": -18.073525,
        "reward_max": 1.2903562500000012,
        "reward_min": -41.83500625,
        "leartime_s": 0.012073109013726935,
        "sampletime": 0.9040708079992328,
        "best_mean": -18.073400000000007,
        "best_max": -1.201875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 9600,
        "reward_mean": -18.061025000000004,
        "reward_max": -4.329250000000001,
        "reward_min": -38.70479375000001,
        "leartime_s": 0.044248605001484975,
        "sampletime": 0.8475416369910818,
        "best_mean": -18.061025000000004,
        "best_max": -4.329250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 9800,
        "reward_mean": -18.06185,
        "reward_max": 1.9204687500000006,
        "reward_min": -35.513243749999994,
        "leartime_s": 0.022183995984960347,
        "sampletime": 0.812602316000266,
        "best_mean": -18.061025000000004,
        "best_max": -4.329250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 10000,
        "reward_mean": -18.05005,
        "reward_max": -3.942306250000002,
        "reward_min": -40.94389374999999,
        "leartime_s": 0.02179268599138595,
        "sampletime": 0.8046539190108888,
        "best_mean": -18.05005,
        "best_max": -3.942306250000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 10200,
        "reward_mean": -18.047774999999994,
        "reward_max": -0.08820625000000092,
        "reward_min": -43.086074999999994,
        "leartime_s": 0.03242346798651852,
        "sampletime": 0.938848595978925,
        "best_mean": -18.047774999999994,
        "best_max": -0.08820625000000092,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 10400,
        "reward_mean": -17.970625,
        "reward_max": -0.9070250000000005,
        "reward_min": -39.84604375,
        "leartime_s": 0.037285183992935345,
        "sampletime": 0.8893670020042919,
        "best_mean": -17.970625,
        "best_max": -0.9070250000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 10600,
        "reward_mean": -17.941424999999995,
        "reward_max": -1.2005187500000003,
        "reward_min": -38.587374999999994,
        "leartime_s": 0.01750732201617211,
        "sampletime": 0.750399862008635,
        "best_mean": -17.941424999999995,
        "best_max": -1.2005187500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 10800,
        "reward_mean": -17.909075,
        "reward_max": -1.930231249999999,
        "reward_min": -39.9981875,
        "leartime_s": 0.010930541990092024,
        "sampletime": 0.7538803030038252,
        "best_mean": -17.909075,
        "best_max": -1.930231249999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 11000,
        "reward_mean": -17.859599999999997,
        "reward_max": -1.9769500000000002,
        "reward_min": -43.71465624999998,
        "leartime_s": 0.0875762449868489,
        "sampletime": 1.0685128619952593,
        "best_mean": -17.859599999999997,
        "best_max": -1.9769500000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 11200,
        "reward_mean": -17.432299999999998,
        "reward_max": -3.919706249999998,
        "reward_min": -49.246124999999985,
        "leartime_s": 0.04367905200342648,
        "sampletime": 0.8871952760091517,
        "best_mean": -17.432299999999998,
        "best_max": -3.919706249999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 11400,
        "reward_mean": -16.278325,
        "reward_max": -4.282125,
        "reward_min": -63.28694374999999,
        "leartime_s": 0.01678460798575543,
        "sampletime": 0.8471798140089959,
        "best_mean": -16.278325,
        "best_max": -4.282125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 11600,
        "reward_mean": -15.182324999999999,
        "reward_max": -4.73595625,
        "reward_min": -39.381712500000006,
        "leartime_s": 0.030005515000084415,
        "sampletime": 1.0239873910031747,
        "best_mean": -15.182324999999999,
        "best_max": -4.73595625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 11800,
        "reward_mean": -14.144474999999998,
        "reward_max": -3.478993749999999,
        "reward_min": -33.25439374999999,
        "leartime_s": 0.05340597699978389,
        "sampletime": 0.795999813999515,
        "best_mean": -14.144474999999998,
        "best_max": -3.478993749999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 12000,
        "reward_mean": -14.4662,
        "reward_max": -4.73903125,
        "reward_min": -34.369531250000016,
        "leartime_s": 0.040050023002550006,
        "sampletime": 0.8315800109994598,
        "best_mean": -14.144474999999998,
        "best_max": -3.478993749999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 12200,
        "reward_mean": -13.413475,
        "reward_max": -4.640131250000001,
        "reward_min": -30.617681249999997,
        "leartime_s": 0.03799918098957278,
        "sampletime": 0.7486433300073259,
        "best_mean": -13.413475,
        "best_max": -4.640131250000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 12400,
        "reward_mean": -11.914375,
        "reward_max": -4.1091875,
        "reward_min": -25.6115375,
        "leartime_s": 0.013432625972200185,
        "sampletime": 0.8699475479952525,
        "best_mean": -11.914375,
        "best_max": -4.1091875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 12600,
        "reward_mean": -11.10425,
        "reward_max": -3.2478499999999992,
        "reward_min": -25.826981250000003,
        "leartime_s": 0.02774084999691695,
        "sampletime": 0.7853169859736226,
        "best_mean": -11.10425,
        "best_max": -3.2478499999999992,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 12800,
        "reward_mean": -10.890324999999999,
        "reward_max": -3.3128375,
        "reward_min": -30.84599375,
        "leartime_s": 0.022464011010015383,
        "sampletime": 0.9307131509995088,
        "best_mean": -10.890324999999999,
        "best_max": -3.3128375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 13000,
        "reward_mean": -10.472625,
        "reward_max": -3.2663749999999996,
        "reward_min": -24.43850000000001,
        "leartime_s": 0.018795948999468237,
        "sampletime": 0.7531335119856521,
        "best_mean": -10.472625,
        "best_max": -3.2663749999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 13200,
        "reward_mean": -10.111699999999999,
        "reward_max": -1.7620125,
        "reward_min": -21.789962499999998,
        "leartime_s": 0.03800748099456541,
        "sampletime": 0.798198405012954,
        "best_mean": -10.111699999999999,
        "best_max": -1.7620125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 13400,
        "reward_mean": -9.273800000000001,
        "reward_max": -2.9587875,
        "reward_min": -25.9748125,
        "leartime_s": 0.04929428600007668,
        "sampletime": 0.7091460829833522,
        "best_mean": -9.273800000000001,
        "best_max": -2.9587875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 13600,
        "reward_mean": -8.536425,
        "reward_max": -3.33584375,
        "reward_min": -23.758249999999997,
        "leartime_s": 0.011776167986681685,
        "sampletime": 0.6525014429935254,
        "best_mean": -8.536425,
        "best_max": -3.33584375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 13800,
        "reward_mean": -8.20035,
        "reward_max": -3.0537687499999997,
        "reward_min": -18.336812499999997,
        "leartime_s": 0.022415760002331808,
        "sampletime": 0.6924621450016275,
        "best_mean": -8.20035,
        "best_max": -3.0537687499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 14000,
        "reward_mean": -7.1914,
        "reward_max": -2.726393750000001,
        "reward_min": -17.8068125,
        "leartime_s": 0.00992512798984535,
        "sampletime": 0.76833062802325,
        "best_mean": -7.1914,
        "best_max": -2.726393750000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 14200,
        "reward_mean": -6.7061,
        "reward_max": -2.893575,
        "reward_min": -18.257787499999996,
        "leartime_s": 0.010603920003632084,
        "sampletime": 0.7176470659906045,
        "best_mean": -6.7061,
        "best_max": -2.893575,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 14400,
        "reward_mean": -6.109124999999999,
        "reward_max": -2.2863937500000002,
        "reward_min": -12.719512499999999,
        "leartime_s": 0.009262631996534765,
        "sampletime": 0.7028009400237352,
        "best_mean": -6.109124999999999,
        "best_max": -2.2863937500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 14600,
        "reward_mean": -5.418800000000001,
        "reward_max": -2.528737499999999,
        "reward_min": -10.207600000000001,
        "leartime_s": 0.03199534400482662,
        "sampletime": 0.6668530630122405,
        "best_mean": -5.418800000000001,
        "best_max": -2.528737499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 14800,
        "reward_mean": -4.662325,
        "reward_max": -1.9396375000000006,
        "reward_min": -7.716625,
        "leartime_s": 0.03440216902527027,
        "sampletime": 0.6849342380010057,
        "best_mean": -4.662325,
        "best_max": -1.9396375000000006,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 15000,
        "reward_mean": -4.2704249999999995,
        "reward_max": -1.4717312499999997,
        "reward_min": -7.0769312499999995,
        "leartime_s": 0.03189601699705236,
        "sampletime": 0.702762080996763,
        "best_mean": -4.2704249999999995,
        "best_max": -1.4717312499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 15200,
        "reward_mean": -3.43345,
        "reward_max": -1.2264999999999993,
        "reward_min": -6.6688875,
        "leartime_s": 0.009511325013590977,
        "sampletime": 0.7606961590063293,
        "best_mean": -3.43345,
        "best_max": -1.2264999999999993,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 15400,
        "reward_mean": -3.7866249999999995,
        "reward_max": -2.0370249999999994,
        "reward_min": -6.594875,
        "leartime_s": 0.029524910991312936,
        "sampletime": 0.7630914539913647,
        "best_mean": -3.43345,
        "best_max": -1.2264999999999993,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 15600,
        "reward_mean": -2.7369499999999998,
        "reward_max": -0.7096312499999999,
        "reward_min": -5.1489312499999995,
        "leartime_s": 0.016386914998292923,
        "sampletime": 0.763470719975885,
        "best_mean": -2.7369499999999998,
        "best_max": -0.7096312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 15800,
        "reward_mean": -2.897125,
        "reward_max": -0.6580562500000001,
        "reward_min": -5.108037500000002,
        "leartime_s": 0.009472323989029974,
        "sampletime": 0.7205684609944001,
        "best_mean": -2.7369499999999998,
        "best_max": -0.7096312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 16000,
        "reward_mean": -2.4486,
        "reward_max": -0.5277687499999999,
        "reward_min": -5.10296875,
        "leartime_s": 0.009588214015820995,
        "sampletime": 0.7604124729987234,
        "best_mean": -2.4486,
        "best_max": -0.5277687499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 16200,
        "reward_mean": -2.4269499999999997,
        "reward_max": -1.023475,
        "reward_min": -4.19780625,
        "leartime_s": 0.017899844999192283,
        "sampletime": 0.759524197987048,
        "best_mean": -2.4269499999999997,
        "best_max": -1.023475,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 16400,
        "reward_mean": -2.3192000000000004,
        "reward_max": -0.8511249999999999,
        "reward_min": -4.454862499999999,
        "leartime_s": 0.023763627017615363,
        "sampletime": 0.7636544449778739,
        "best_mean": -2.3192000000000004,
        "best_max": -0.8511249999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 16600,
        "reward_mean": -2.28235,
        "reward_max": -0.8108562499999997,
        "reward_min": -4.1857875,
        "leartime_s": 0.01926165199256502,
        "sampletime": 0.8173944590089377,
        "best_mean": -2.28235,
        "best_max": -0.8108562499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 16800,
        "reward_mean": -1.8190500000000003,
        "reward_max": -0.23069374999999984,
        "reward_min": -3.6155812500000004,
        "leartime_s": 0.04504555999301374,
        "sampletime": 0.7055141879827715,
        "best_mean": -1.8190500000000003,
        "best_max": -0.23069374999999984,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 17000,
        "reward_mean": -1.9408750000000001,
        "reward_max": -0.6690562500000001,
        "reward_min": -3.86300625,
        "leartime_s": 0.04852992299129255,
        "sampletime": 0.6806938520167023,
        "best_mean": -1.8190500000000003,
        "best_max": -0.23069374999999984,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 17200,
        "reward_mean": -1.6920500000000003,
        "reward_max": -0.2340312499999999,
        "reward_min": -3.7999125000000005,
        "leartime_s": 0.03134432400111109,
        "sampletime": 0.875247458985541,
        "best_mean": -1.6920500000000003,
        "best_max": -0.2340312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 17400,
        "reward_mean": -1.5661749999999997,
        "reward_max": -0.29635625000000004,
        "reward_min": -3.7066687499999995,
        "leartime_s": 0.030106374993920326,
        "sampletime": 0.8043014270078856,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 17600,
        "reward_mean": -1.9904500000000003,
        "reward_max": -0.7383250000000002,
        "reward_min": -3.7684374999999997,
        "leartime_s": 0.01479546498740092,
        "sampletime": 0.7210353609989397,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 17800,
        "reward_mean": -1.763775,
        "reward_max": -0.5710062500000003,
        "reward_min": -3.054312500000001,
        "leartime_s": 0.02739138199831359,
        "sampletime": 0.6565302160161082,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 18000,
        "reward_mean": -1.7624000000000002,
        "reward_max": -0.7629312499999997,
        "reward_min": -3.257268750000001,
        "leartime_s": 0.022773762000724673,
        "sampletime": 0.770028370025102,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 18200,
        "reward_mean": -1.84985,
        "reward_max": -0.56031875,
        "reward_min": -3.27489375,
        "leartime_s": 0.019518962973961607,
        "sampletime": 0.7592083600175101,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 18400,
        "reward_mean": -1.7313749999999997,
        "reward_max": -0.6943187500000001,
        "reward_min": -3.13181875,
        "leartime_s": 0.015201608010102063,
        "sampletime": 0.7025929609953891,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 18600,
        "reward_mean": -1.7858749999999999,
        "reward_max": -0.6648375,
        "reward_min": -2.9781062500000006,
        "leartime_s": 0.01841410601628013,
        "sampletime": 0.6537613259861246,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 18800,
        "reward_mean": -1.7013,
        "reward_max": -0.6698562499999999,
        "reward_min": -3.57475,
        "leartime_s": 0.06685068001388572,
        "sampletime": 0.811362153996015,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 19000,
        "reward_mean": -1.5756999999999999,
        "reward_max": -0.5198124999999998,
        "reward_min": -3.0232812499999997,
        "leartime_s": 0.03442622098373249,
        "sampletime": 0.6984484379936475,
        "best_mean": -1.5661749999999997,
        "best_max": -0.29635625000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 19200,
        "reward_mean": -1.5448999999999997,
        "reward_max": -0.3293312499999999,
        "reward_min": -3.1617250000000006,
        "leartime_s": 0.009760254994034767,
        "sampletime": 0.723135285981698,
        "best_mean": -1.5448999999999997,
        "best_max": -0.3293312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 19400,
        "reward_mean": -1.643475,
        "reward_max": -0.6601812499999997,
        "reward_min": -3.15468125,
        "leartime_s": 0.03179522400023416,
        "sampletime": 0.6999121579865459,
        "best_mean": -1.5448999999999997,
        "best_max": -0.3293312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 19600,
        "reward_mean": -1.5135499999999997,
        "reward_max": -0.54189375,
        "reward_min": -2.8666,
        "leartime_s": 0.011908401997061446,
        "sampletime": 0.7283511539862957,
        "best_mean": -1.5135499999999997,
        "best_max": -0.54189375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 19800,
        "reward_mean": -1.8759,
        "reward_max": -0.7646437500000001,
        "reward_min": -2.9714687499999997,
        "leartime_s": 0.028552556002978235,
        "sampletime": 0.7019802719878498,
        "best_mean": -1.5135499999999997,
        "best_max": -0.54189375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 20000,
        "reward_mean": -1.4370999999999996,
        "reward_max": -0.4230999999999999,
        "reward_min": -2.54565625,
        "leartime_s": 0.026054532994749025,
        "sampletime": 0.7751829600019846,
        "best_mean": -1.4370999999999996,
        "best_max": -0.4230999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 20200,
        "reward_mean": -1.7303,
        "reward_max": -0.5704499999999998,
        "reward_min": -3.1595500000000007,
        "leartime_s": 0.01379216299392283,
        "sampletime": 0.8386810029915068,
        "best_mean": -1.4370999999999996,
        "best_max": -0.4230999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 20400,
        "reward_mean": -1.5841249999999998,
        "reward_max": -0.4924312499999996,
        "reward_min": -2.9211437499999997,
        "leartime_s": 0.019605733978096396,
        "sampletime": 0.728898303990718,
        "best_mean": -1.4370999999999996,
        "best_max": -0.4230999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 20600,
        "reward_mean": -1.5763250000000002,
        "reward_max": -0.7137625000000001,
        "reward_min": -3.0885812500000007,
        "leartime_s": 0.023077054996974766,
        "sampletime": 0.6272482899948955,
        "best_mean": -1.4370999999999996,
        "best_max": -0.4230999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 20800,
        "reward_mean": -1.3877999999999997,
        "reward_max": -0.5116437499999997,
        "reward_min": -2.30573125,
        "leartime_s": 0.021250903024338186,
        "sampletime": 0.7123846480099019,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 21000,
        "reward_mean": -1.5924749999999996,
        "reward_max": -0.48574999999999946,
        "reward_min": -2.86671875,
        "leartime_s": 0.018780688988044858,
        "sampletime": 0.7301194230094552,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 21200,
        "reward_mean": -1.457725,
        "reward_max": -0.5114125,
        "reward_min": -3.0341249999999995,
        "leartime_s": 0.028404017008142546,
        "sampletime": 0.7815102660097182,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 21400,
        "reward_mean": -1.5365,
        "reward_max": -0.5411312499999998,
        "reward_min": -3.2747937500000006,
        "leartime_s": 0.016602146002696827,
        "sampletime": 0.7835388880048413,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 21600,
        "reward_mean": -1.531275,
        "reward_max": -0.5398687499999999,
        "reward_min": -2.9048374999999997,
        "leartime_s": 0.03073372700600885,
        "sampletime": 0.7724752070207614,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 21800,
        "reward_mean": -1.5757249999999998,
        "reward_max": -0.59760625,
        "reward_min": -2.8313999999999995,
        "leartime_s": 0.02441422300762497,
        "sampletime": 0.6874095279781613,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 22000,
        "reward_mean": -1.55475,
        "reward_max": -0.5410437499999998,
        "reward_min": -2.9477187500000004,
        "leartime_s": 0.021212312974967062,
        "sampletime": 0.6963092490041163,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 22200,
        "reward_mean": -1.6288500000000001,
        "reward_max": -0.7743250000000002,
        "reward_min": -2.9687250000000005,
        "leartime_s": 0.021860759996343404,
        "sampletime": 0.7162535369861871,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 22400,
        "reward_mean": -1.665225,
        "reward_max": -0.6767875000000001,
        "reward_min": -2.74770625,
        "leartime_s": 0.01345817800029181,
        "sampletime": 0.6877558029955253,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 22600,
        "reward_mean": -1.8258999999999999,
        "reward_max": -0.8286375000000001,
        "reward_min": -3.2570437500000002,
        "leartime_s": 0.016688936011632904,
        "sampletime": 0.7605450099799782,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 22800,
        "reward_mean": -1.7454750000000003,
        "reward_max": -0.5529562499999999,
        "reward_min": -3.1380749999999993,
        "leartime_s": 0.009834869008045644,
        "sampletime": 0.7098312230082229,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 23000,
        "reward_mean": -1.7635499999999997,
        "reward_max": -0.7963937499999998,
        "reward_min": -2.874762499999999,
        "leartime_s": 0.02089169100509025,
        "sampletime": 0.8755836789787281,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 23200,
        "reward_mean": -1.5779499999999997,
        "reward_max": -0.7178374999999997,
        "reward_min": -2.8367812500000005,
        "leartime_s": 0.02030450798338279,
        "sampletime": 0.7806011799839325,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 23400,
        "reward_mean": -1.5462249999999997,
        "reward_max": -0.7234437499999998,
        "reward_min": -3.2347687500000006,
        "leartime_s": 0.011009216017555445,
        "sampletime": 0.6381484750017989,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 23600,
        "reward_mean": -1.504525,
        "reward_max": -0.49818749999999984,
        "reward_min": -2.8106874999999993,
        "leartime_s": 0.030146747012622654,
        "sampletime": 0.738978617999237,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 23800,
        "reward_mean": -1.6816,
        "reward_max": -0.6511,
        "reward_min": -3.3949749999999996,
        "leartime_s": 0.04996513298829086,
        "sampletime": 0.7149824380176142,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 24000,
        "reward_mean": -1.6650249999999998,
        "reward_max": -0.8023625000000001,
        "reward_min": -3.6807625,
        "leartime_s": 0.06593473799875937,
        "sampletime": 0.6858246069750749,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 24200,
        "reward_mean": -1.589125,
        "reward_max": -0.7103499999999999,
        "reward_min": -3.3288124999999993,
        "leartime_s": 0.021270725992508233,
        "sampletime": 0.8548474549897946,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 24400,
        "reward_mean": -1.6499999999999997,
        "reward_max": -0.5847124999999999,
        "reward_min": -2.90174375,
        "leartime_s": 0.024224571010563523,
        "sampletime": 0.7518063960014842,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 24600,
        "reward_mean": -1.878575,
        "reward_max": -0.63775625,
        "reward_min": -3.078112499999999,
        "leartime_s": 0.03363203801563941,
        "sampletime": 0.6695458680042066,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 24800,
        "reward_mean": -1.731075,
        "reward_max": -0.7234562499999998,
        "reward_min": -3.1696625000000003,
        "leartime_s": 0.03879504598444328,
        "sampletime": 0.753405967989238,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 25000,
        "reward_mean": -1.5796750000000002,
        "reward_max": -0.46559375000000003,
        "reward_min": -2.84706875,
        "leartime_s": 0.020274281996535137,
        "sampletime": 0.8678662519960199,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 25200,
        "reward_mean": -1.8320750000000003,
        "reward_max": -0.824775,
        "reward_min": -3.0750125,
        "leartime_s": 0.029174330993555486,
        "sampletime": 0.7507228479953483,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 25400,
        "reward_mean": -1.6217249999999999,
        "reward_max": -0.7080187499999998,
        "reward_min": -2.73124375,
        "leartime_s": 0.018377197004156187,
        "sampletime": 0.7674120070005301,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 25600,
        "reward_mean": -1.5749000000000002,
        "reward_max": -0.57615,
        "reward_min": -2.8243,
        "leartime_s": 0.02343769697472453,
        "sampletime": 0.7399920540046878,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 25800,
        "reward_mean": -1.5928749999999998,
        "reward_max": -0.72011875,
        "reward_min": -3.0348500000000005,
        "leartime_s": 0.01336211001034826,
        "sampletime": 0.7164064759854227,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 26000,
        "reward_mean": -1.6556749999999998,
        "reward_max": -0.44318749999999996,
        "reward_min": -3.814675,
        "leartime_s": 0.02649765700334683,
        "sampletime": 0.7895573590067215,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 26200,
        "reward_mean": -1.8749999999999998,
        "reward_max": -0.9017375,
        "reward_min": -3.1712749999999996,
        "leartime_s": 0.0413803820265457,
        "sampletime": 0.6871260569896549,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 26400,
        "reward_mean": -1.555,
        "reward_max": -0.3419374999999998,
        "reward_min": -2.744225,
        "leartime_s": 0.03731146000791341,
        "sampletime": 0.7487422109988984,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 26600,
        "reward_mean": -1.6916,
        "reward_max": -0.6238062499999999,
        "reward_min": -2.82810625,
        "leartime_s": 0.07037870399653912,
        "sampletime": 0.6683397000015248,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 26800,
        "reward_mean": -1.83,
        "reward_max": -0.9242750000000001,
        "reward_min": -3.0470374999999996,
        "leartime_s": 0.024990556004922837,
        "sampletime": 0.7866064140107483,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 27000,
        "reward_mean": -1.6803500000000002,
        "reward_max": -0.86060625,
        "reward_min": -2.9091812500000005,
        "leartime_s": 0.03418604098260403,
        "sampletime": 0.8657319660123903,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 27200,
        "reward_mean": -1.6442249999999996,
        "reward_max": -0.7702437499999998,
        "reward_min": -3.1438125,
        "leartime_s": 0.012968606984941289,
        "sampletime": 0.7386079050193075,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 27400,
        "reward_mean": -1.5966749999999998,
        "reward_max": -0.6227874999999998,
        "reward_min": -2.938643749999999,
        "leartime_s": 0.03260091200354509,
        "sampletime": 0.6622022450028453,
        "best_mean": -1.3877999999999997,
        "best_max": -0.5116437499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 27600,
        "reward_mean": -1.0805749999999998,
        "reward_max": -0.23141250000000002,
        "reward_min": -2.3027249999999997,
        "leartime_s": 0.04016633701394312,
        "sampletime": 0.6657198260072619,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 27800,
        "reward_mean": -1.5244499999999999,
        "reward_max": -0.4970874999999999,
        "reward_min": -2.50173125,
        "leartime_s": 0.018903854012023658,
        "sampletime": 0.7657060869969428,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 28000,
        "reward_mean": -1.531825,
        "reward_max": -0.5639437499999997,
        "reward_min": -2.62384375,
        "leartime_s": 0.010492739995243028,
        "sampletime": 0.6857687180163339,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 28200,
        "reward_mean": -1.5344250000000001,
        "reward_max": -0.6506062499999997,
        "reward_min": -2.7845812499999996,
        "leartime_s": 0.020932004001224414,
        "sampletime": 0.7139361259760335,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 28400,
        "reward_mean": -1.4006750000000001,
        "reward_max": -0.4323625,
        "reward_min": -3.058025000000001,
        "leartime_s": 0.029316452011698857,
        "sampletime": 0.7263965190213639,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 28600,
        "reward_mean": -1.7100500000000003,
        "reward_max": -0.8899250000000001,
        "reward_min": -3.020493750000001,
        "leartime_s": 0.01663581599132158,
        "sampletime": 0.7657262840075418,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 28800,
        "reward_mean": -1.4469999999999998,
        "reward_max": -0.36225000000000007,
        "reward_min": -2.4772999999999987,
        "leartime_s": 0.03443038501427509,
        "sampletime": 0.7619201180059463,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 29000,
        "reward_mean": -1.6336499999999996,
        "reward_max": -0.6308750000000001,
        "reward_min": -2.93906875,
        "leartime_s": 0.016535359987756237,
        "sampletime": 0.6983385649800766,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 29200,
        "reward_mean": -1.4807999999999997,
        "reward_max": -0.6801562499999999,
        "reward_min": -2.66125,
        "leartime_s": 0.02176555700134486,
        "sampletime": 0.7048211570072453,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 29400,
        "reward_mean": -1.7743250000000004,
        "reward_max": -0.859475,
        "reward_min": -3.16291875,
        "leartime_s": 0.03211974902660586,
        "sampletime": 0.8287619890179485,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 29600,
        "reward_mean": -1.2843499999999999,
        "reward_max": -0.48039375000000006,
        "reward_min": -2.494475,
        "leartime_s": 0.05115747099625878,
        "sampletime": 0.7458203510032035,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 29800,
        "reward_mean": -1.464725,
        "reward_max": -0.6143749999999998,
        "reward_min": -2.9305000000000003,
        "leartime_s": 0.05753513201489113,
        "sampletime": 0.6804408910102211,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 30000,
        "reward_mean": -1.4336750000000003,
        "reward_max": -0.4679000000000002,
        "reward_min": -2.7821000000000002,
        "leartime_s": 0.050303408002946526,
        "sampletime": 0.7339456519985106,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 30200,
        "reward_mean": -1.129375,
        "reward_max": -0.030481249999999988,
        "reward_min": -3.0936624999999993,
        "leartime_s": 0.013440777984214947,
        "sampletime": 0.7659881720028352,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 30400,
        "reward_mean": -1.3579250000000003,
        "reward_max": -0.5361250000000001,
        "reward_min": -2.5358187499999993,
        "leartime_s": 0.024634398985654116,
        "sampletime": 0.7423785139981192,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 30600,
        "reward_mean": -1.3615249999999999,
        "reward_max": -0.30315625,
        "reward_min": -2.90873125,
        "leartime_s": 0.03518060699570924,
        "sampletime": 0.8175669980118982,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 30800,
        "reward_mean": -1.5682250000000002,
        "reward_max": -0.6356374999999999,
        "reward_min": -2.9547000000000003,
        "leartime_s": 0.017474075022619218,
        "sampletime": 0.7485584320093039,
        "best_mean": -1.0805749999999998,
        "best_max": -0.23141250000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 31000,
        "reward_mean": -1.018075,
        "reward_max": -0.21143750000000022,
        "reward_min": -2.0828562500000003,
        "leartime_s": 0.033005044009769335,
        "sampletime": 0.7029329930082895,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 31200,
        "reward_mean": -1.37765,
        "reward_max": -0.21472500000000022,
        "reward_min": -2.5161125,
        "leartime_s": 0.027307742013363168,
        "sampletime": 0.7350763450085651,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 31400,
        "reward_mean": -1.1446000000000003,
        "reward_max": -0.2515312500000001,
        "reward_min": -2.4437937500000007,
        "leartime_s": 0.01554199299425818,
        "sampletime": 0.7433979430061299,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 31600,
        "reward_mean": -1.2965000000000002,
        "reward_max": -0.34308125,
        "reward_min": -2.4859,
        "leartime_s": 0.02112059498904273,
        "sampletime": 0.731194651016267,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 31800,
        "reward_mean": -1.31315,
        "reward_max": -0.40642500000000015,
        "reward_min": -2.3918749999999998,
        "leartime_s": 0.014308555983006954,
        "sampletime": 0.7373867690039333,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 32000,
        "reward_mean": -1.3542750000000001,
        "reward_max": -0.35001250000000006,
        "reward_min": -2.32040625,
        "leartime_s": 0.022335904010105878,
        "sampletime": 0.737144721992081,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 32200,
        "reward_mean": -1.4585500000000002,
        "reward_max": -0.5655687500000002,
        "reward_min": -2.5773437500000007,
        "leartime_s": 0.02572073001647368,
        "sampletime": 0.8216651730181184,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 32400,
        "reward_mean": -1.3594750000000002,
        "reward_max": -0.2339812500000001,
        "reward_min": -2.43435625,
        "leartime_s": 0.01313533799839206,
        "sampletime": 0.7687308119784575,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 32600,
        "reward_mean": -1.35835,
        "reward_max": -0.32595,
        "reward_min": -2.45035,
        "leartime_s": 0.013861151994206011,
        "sampletime": 0.7445720469986554,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 32800,
        "reward_mean": -1.385875,
        "reward_max": -0.50783125,
        "reward_min": -2.6404875000000003,
        "leartime_s": 0.015207807009574026,
        "sampletime": 0.6363944490149152,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 33000,
        "reward_mean": -1.4004000000000003,
        "reward_max": -0.4306437500000001,
        "reward_min": -2.550925,
        "leartime_s": 0.06975943499128334,
        "sampletime": 0.6989593460166361,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 33200,
        "reward_mean": -1.2064750000000002,
        "reward_max": -0.10226875000000021,
        "reward_min": -2.4666625,
        "leartime_s": 0.07761913299327716,
        "sampletime": 0.8035531010245904,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 33400,
        "reward_mean": -1.2321000000000002,
        "reward_max": -0.2494812500000002,
        "reward_min": -2.3648812500000003,
        "leartime_s": 0.053087514999788254,
        "sampletime": 0.6564136249944568,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 33600,
        "reward_mean": -1.361,
        "reward_max": -0.5254812500000002,
        "reward_min": -2.3961062500000003,
        "leartime_s": 0.036850002012215555,
        "sampletime": 0.7462018299847841,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 33800,
        "reward_mean": -1.3657500000000002,
        "reward_max": -0.6209937500000006,
        "reward_min": -2.512575,
        "leartime_s": 0.02633660499122925,
        "sampletime": 0.6942236949980725,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 34000,
        "reward_mean": -1.0495999999999999,
        "reward_max": -0.11963750000000016,
        "reward_min": -2.1765562499999995,
        "leartime_s": 0.020661054004449397,
        "sampletime": 0.8371397139853798,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 34200,
        "reward_mean": -1.25565,
        "reward_max": -0.18766875000000002,
        "reward_min": -2.6266187499999996,
        "leartime_s": 0.01335204901988618,
        "sampletime": 0.7611963319941424,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 34400,
        "reward_mean": -1.3683000000000005,
        "reward_max": -0.34065625000000016,
        "reward_min": -2.5355562500000004,
        "leartime_s": 0.023694012983469293,
        "sampletime": 0.6712486280011944,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 34600,
        "reward_mean": -1.205875,
        "reward_max": -0.30711250000000007,
        "reward_min": -2.8697812499999995,
        "leartime_s": 0.021253827988402918,
        "sampletime": 0.7985679400153458,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 34800,
        "reward_mean": -1.2009,
        "reward_max": 0.03071249999999998,
        "reward_min": -2.3387687499999994,
        "leartime_s": 0.018007653998211026,
        "sampletime": 0.7510412579867989,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 35000,
        "reward_mean": -1.0752249999999999,
        "reward_max": -0.17386249999999995,
        "reward_min": -2.1306125000000002,
        "leartime_s": 0.03166489701834507,
        "sampletime": 0.7423435160017107,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 35200,
        "reward_mean": -1.1157000000000001,
        "reward_max": -0.1601750000000001,
        "reward_min": -2.2512687500000004,
        "leartime_s": 0.020837845018832013,
        "sampletime": 0.7869053600006737,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 35400,
        "reward_mean": -1.2260749999999998,
        "reward_max": -0.31200625,
        "reward_min": -2.2513437499999998,
        "leartime_s": 0.053669981978600845,
        "sampletime": 0.6726199019758496,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 35600,
        "reward_mean": -1.184,
        "reward_max": -0.2994125,
        "reward_min": -2.5456250000000002,
        "leartime_s": 0.04403916001319885,
        "sampletime": 0.7378318639821373,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 35800,
        "reward_mean": -1.181025,
        "reward_max": 0.05364374999999989,
        "reward_min": -2.8187374999999992,
        "leartime_s": 0.012349573982646689,
        "sampletime": 0.8146100709855091,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 36000,
        "reward_mean": -1.212625,
        "reward_max": -0.40726875,
        "reward_min": -2.84635,
        "leartime_s": 0.03085465100593865,
        "sampletime": 0.6522873240173794,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 36200,
        "reward_mean": -1.141375,
        "reward_max": -0.19126250000000009,
        "reward_min": -2.2554562499999995,
        "leartime_s": 0.027361323998775333,
        "sampletime": 0.7095737770141568,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 36400,
        "reward_mean": -1.2274,
        "reward_max": -0.32248124999999994,
        "reward_min": -2.3848562500000003,
        "leartime_s": 0.02174271800322458,
        "sampletime": 0.7353807020117529,
        "best_mean": -1.018075,
        "best_max": -0.21143750000000022,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 36600,
        "reward_mean": -0.991475,
        "reward_max": 0.09004374999999999,
        "reward_min": -1.9563749999999998,
        "leartime_s": 0.04391770201618783,
        "sampletime": 0.6590601560019422,
        "best_mean": -0.991475,
        "best_max": 0.09004374999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 36800,
        "reward_mean": -1.2248500000000002,
        "reward_max": -0.18482500000000007,
        "reward_min": -2.6121124999999994,
        "leartime_s": 0.043104759010020643,
        "sampletime": 0.7141679549822584,
        "best_mean": -0.991475,
        "best_max": 0.09004374999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 37000,
        "reward_mean": -0.921875,
        "reward_max": -0.17420624999999998,
        "reward_min": -2.2875937499999996,
        "leartime_s": 0.029248006001580507,
        "sampletime": 0.673132001014892,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 37200,
        "reward_mean": -0.9785750000000001,
        "reward_max": -0.11030624999999995,
        "reward_min": -2.1103,
        "leartime_s": 0.02530730000580661,
        "sampletime": 0.7404955239908304,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 37400,
        "reward_mean": -1.1262750000000001,
        "reward_max": -0.2930499999999999,
        "reward_min": -2.3508562499999996,
        "leartime_s": 0.022030082007404417,
        "sampletime": 0.7624746359942947,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 37600,
        "reward_mean": -1.1870249999999998,
        "reward_max": -0.2570687499999999,
        "reward_min": -2.32363125,
        "leartime_s": 0.015539173997240141,
        "sampletime": 0.821753043011995,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 37800,
        "reward_mean": -0.9540749999999999,
        "reward_max": 0.10330000000000009,
        "reward_min": -2.1845375000000002,
        "leartime_s": 0.012083782989066094,
        "sampletime": 0.6630525159998797,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 38000,
        "reward_mean": -0.993625,
        "reward_max": 0.027712500000000168,
        "reward_min": -2.1724687499999997,
        "leartime_s": 0.02875465899705887,
        "sampletime": 0.698925862001488,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 38200,
        "reward_mean": -0.973475,
        "reward_max": -0.08608124999999994,
        "reward_min": -1.9714187500000007,
        "leartime_s": 0.016714569996111095,
        "sampletime": 0.6908192240225617,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 38400,
        "reward_mean": -1.074575,
        "reward_max": -0.14586874999999996,
        "reward_min": -2.577824999999999,
        "leartime_s": 0.011752320977393538,
        "sampletime": 0.8139855959743727,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 38600,
        "reward_mean": -1.1669499999999997,
        "reward_max": -0.23779999999999998,
        "reward_min": -2.652525,
        "leartime_s": 0.024290966015541926,
        "sampletime": 0.6708236580016091,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 38800,
        "reward_mean": -0.9524000000000001,
        "reward_max": 0.02621250000000007,
        "reward_min": -1.8609875,
        "leartime_s": 0.023174205009127036,
        "sampletime": 0.6415813409839757,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 39000,
        "reward_mean": -1.1127,
        "reward_max": -0.09558750000000002,
        "reward_min": -2.53985,
        "leartime_s": 0.020426713017513976,
        "sampletime": 0.728574740991462,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 39200,
        "reward_mean": -1.03935,
        "reward_max": -0.016006250000000055,
        "reward_min": -2.380662499999999,
        "leartime_s": 0.033826872997451574,
        "sampletime": 0.7684251910250168,
        "best_mean": -0.921875,
        "best_max": -0.17420624999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 39400,
        "reward_mean": -0.81285,
        "reward_max": 0.2050000000000003,
        "reward_min": -2.1846375,
        "leartime_s": 0.021440069016534835,
        "sampletime": 0.7240831179951783,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 39600,
        "reward_mean": -1.0255,
        "reward_max": -0.10388125000000004,
        "reward_min": -2.1606312500000002,
        "leartime_s": 0.018051378021482378,
        "sampletime": 0.6914199230086524,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 39800,
        "reward_mean": -1.03805,
        "reward_max": -0.01598124999999992,
        "reward_min": -2.4469,
        "leartime_s": 0.032595213007880375,
        "sampletime": 0.7148074450087734,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 40000,
        "reward_mean": -1.0072750000000001,
        "reward_max": -0.25756250000000014,
        "reward_min": -2.078775,
        "leartime_s": 0.05793495400575921,
        "sampletime": 0.7926828220079187,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 40200,
        "reward_mean": -1.1353499999999999,
        "reward_max": 0.02201875000000025,
        "reward_min": -2.17458125,
        "leartime_s": 0.059902245993725955,
        "sampletime": 0.7364034460042603,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 40400,
        "reward_mean": -0.8667999999999998,
        "reward_max": 0.05467500000000003,
        "reward_min": -1.7084624999999996,
        "leartime_s": 0.035760620987275615,
        "sampletime": 0.8214267040020786,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 40600,
        "reward_mean": -1.141775,
        "reward_max": -0.2653062500000002,
        "reward_min": -2.603175,
        "leartime_s": 0.055226682976353914,
        "sampletime": 0.7528758060070686,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 40800,
        "reward_mean": -0.9722999999999999,
        "reward_max": -0.07092499999999989,
        "reward_min": -1.9493625,
        "leartime_s": 0.044556854001712054,
        "sampletime": 0.8052904710057192,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 41000,
        "reward_mean": -0.8815749999999998,
        "reward_max": 0.2186625,
        "reward_min": -2.58710625,
        "leartime_s": 0.021804891002830118,
        "sampletime": 0.6893435259989928,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 41200,
        "reward_mean": -0.9971249999999999,
        "reward_max": -0.1491937499999998,
        "reward_min": -2.02419375,
        "leartime_s": 0.028623610007343814,
        "sampletime": 0.7703714260132983,
        "best_mean": -0.81285,
        "best_max": 0.2050000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 41400,
        "reward_mean": -0.805525,
        "reward_max": 0.01690624999999997,
        "reward_min": -1.8477000000000001,
        "leartime_s": 0.03745121098472737,
        "sampletime": 0.7785398249980062,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 41600,
        "reward_mean": -1.046625,
        "reward_max": -0.0679375000000001,
        "reward_min": -2.1328562499999997,
        "leartime_s": 0.040716613992117345,
        "sampletime": 0.7610145349754021,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 41800,
        "reward_mean": -0.9345249999999999,
        "reward_max": 0.06406875000000009,
        "reward_min": -1.8948,
        "leartime_s": 0.061663512024097145,
        "sampletime": 0.701126808009576,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 42000,
        "reward_mean": -1.02375,
        "reward_max": 0.039881250000000035,
        "reward_min": -2.396724999999999,
        "leartime_s": 0.045856507000280544,
        "sampletime": 0.6950955159845762,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 42200,
        "reward_mean": -1.0517249999999998,
        "reward_max": -0.13049999999999998,
        "reward_min": -2.2683,
        "leartime_s": 0.03356667800107971,
        "sampletime": 0.7864926870097406,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 42400,
        "reward_mean": -1.0246999999999997,
        "reward_max": -0.10037499999999999,
        "reward_min": -2.2843812499999996,
        "leartime_s": 0.021287968003889546,
        "sampletime": 0.75808091199724,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 42600,
        "reward_mean": -0.82,
        "reward_max": 0.05966250000000006,
        "reward_min": -2.1166687500000005,
        "leartime_s": 0.05085931601934135,
        "sampletime": 0.7487901799904648,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 42800,
        "reward_mean": -0.978575,
        "reward_max": -0.10728750000000001,
        "reward_min": -1.9812937500000003,
        "leartime_s": 0.03922226600116119,
        "sampletime": 0.8839626899862196,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 43000,
        "reward_mean": -0.8212249999999998,
        "reward_max": 0.16227500000000006,
        "reward_min": -2.0242874999999994,
        "leartime_s": 0.027474124974105507,
        "sampletime": 0.7610120880126487,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 43200,
        "reward_mean": -1.1582,
        "reward_max": -0.06839999999999996,
        "reward_min": -2.5729124999999997,
        "leartime_s": 0.017659545002970845,
        "sampletime": 0.7620005809876602,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 43400,
        "reward_mean": -1.05475,
        "reward_max": -0.21842500000000012,
        "reward_min": -2.6578187500000006,
        "leartime_s": 0.03341954099596478,
        "sampletime": 0.787538467993727,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 43600,
        "reward_mean": -0.9672999999999999,
        "reward_max": 0.2978437500000001,
        "reward_min": -1.8868250000000002,
        "leartime_s": 0.024597017996711656,
        "sampletime": 0.7368000029819086,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 43800,
        "reward_mean": -0.9185499999999998,
        "reward_max": -0.03232499999999979,
        "reward_min": -2.240012499999999,
        "leartime_s": 0.022187333001056686,
        "sampletime": 0.8939627540239599,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 44000,
        "reward_mean": -0.9046000000000001,
        "reward_max": 0.20033125000000007,
        "reward_min": -2.1265875000000003,
        "leartime_s": 0.049587929010158405,
        "sampletime": 0.7210070110158995,
        "best_mean": -0.805525,
        "best_max": 0.01690624999999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 44200,
        "reward_mean": -0.7620750000000001,
        "reward_max": 0.1871,
        "reward_min": -1.7692125000000003,
        "leartime_s": 0.03757636700174771,
        "sampletime": 0.8254776760004461,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 44400,
        "reward_mean": -0.9639249999999998,
        "reward_max": -0.019587499999999827,
        "reward_min": -2.442425,
        "leartime_s": 0.025921185995684937,
        "sampletime": 0.7247467940032948,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 44600,
        "reward_mean": -1.1044249999999998,
        "reward_max": -0.22144999999999995,
        "reward_min": -2.2738999999999994,
        "leartime_s": 0.03644682900630869,
        "sampletime": 0.7088264189951587,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 44800,
        "reward_mean": -0.9363500000000001,
        "reward_max": -0.08383750000000016,
        "reward_min": -2.0357625,
        "leartime_s": 0.025216562004061416,
        "sampletime": 0.8483067380147986,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 45000,
        "reward_mean": -0.8030749999999999,
        "reward_max": 0.27346250000000005,
        "reward_min": -1.9837124999999998,
        "leartime_s": 0.032205283001530915,
        "sampletime": 0.7638599150232039,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 45200,
        "reward_mean": -0.8465750000000001,
        "reward_max": 0.029643749999999955,
        "reward_min": -1.9703562500000003,
        "leartime_s": 0.029107725014910102,
        "sampletime": 0.6894757660047617,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 45400,
        "reward_mean": -0.8379999999999999,
        "reward_max": 0.12920000000000004,
        "reward_min": -2.0739499999999995,
        "leartime_s": 0.027391005016397685,
        "sampletime": 0.7306539240234997,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 45600,
        "reward_mean": -0.883875,
        "reward_max": 0.03140625000000009,
        "reward_min": -2.0951624999999994,
        "leartime_s": 0.022566886007552966,
        "sampletime": 0.6787333420070354,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 45800,
        "reward_mean": -0.8021999999999998,
        "reward_max": 0.1428,
        "reward_min": -2.2929749999999998,
        "leartime_s": 0.03700134198879823,
        "sampletime": 0.7532398600014858,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 46000,
        "reward_mean": -1.065825,
        "reward_max": -0.0980812499999999,
        "reward_min": -2.2694812499999997,
        "leartime_s": 0.04141831997549161,
        "sampletime": 0.7083853240183089,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 46200,
        "reward_mean": -1.0736749999999997,
        "reward_max": -0.15476874999999993,
        "reward_min": -2.287975,
        "leartime_s": 0.04495801098528318,
        "sampletime": 0.715319986018585,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 46400,
        "reward_mean": -0.9305749999999997,
        "reward_max": 0.07040625000000031,
        "reward_min": -2.0748499999999996,
        "leartime_s": 0.025058600993361324,
        "sampletime": 0.7528941470081918,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 46600,
        "reward_mean": -1.0003000000000002,
        "reward_max": 0.07216249999999996,
        "reward_min": -2.345225,
        "leartime_s": 0.03303827898344025,
        "sampletime": 0.7719774470024277,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 46800,
        "reward_mean": -0.898725,
        "reward_max": 0.04855,
        "reward_min": -2.2041375,
        "leartime_s": 0.023259869980392978,
        "sampletime": 0.6857052579871379,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 47000,
        "reward_mean": -0.9311499999999999,
        "reward_max": -0.013437499999999838,
        "reward_min": -2.4489375,
        "leartime_s": 0.016648010001517832,
        "sampletime": 0.7212048860092182,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 47200,
        "reward_mean": -0.9571000000000001,
        "reward_max": -0.03300000000000021,
        "reward_min": -1.9242000000000001,
        "leartime_s": 0.04469042900018394,
        "sampletime": 0.6955422209866811,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 47400,
        "reward_mean": -0.8311749999999998,
        "reward_max": 0.25709375000000007,
        "reward_min": -2.3055999999999996,
        "leartime_s": 0.04490301001351327,
        "sampletime": 0.7677890069899149,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 47600,
        "reward_mean": -0.9395749999999998,
        "reward_max": -0.04566874999999991,
        "reward_min": -1.8548312500000002,
        "leartime_s": 0.05954995800857432,
        "sampletime": 0.7354189720063005,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 47800,
        "reward_mean": -1.0682749999999999,
        "reward_max": -0.0754187499999998,
        "reward_min": -2.37954375,
        "leartime_s": 0.0445235280203633,
        "sampletime": 0.6356198410212528,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 48000,
        "reward_mean": -0.9449500000000001,
        "reward_max": 0.10165,
        "reward_min": -2.2197687499999996,
        "leartime_s": 0.04275565699208528,
        "sampletime": 0.6672173060069326,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 48200,
        "reward_mean": -1.2606749999999998,
        "reward_max": -0.2673375,
        "reward_min": -2.470674999999999,
        "leartime_s": 0.07245260599302128,
        "sampletime": 0.6704254799988121,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 48400,
        "reward_mean": -1.014325,
        "reward_max": -0.007043749999999932,
        "reward_min": -1.9607812499999995,
        "leartime_s": 0.06718724500387907,
        "sampletime": 0.7137972559721675,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 48600,
        "reward_mean": -1.2639749999999998,
        "reward_max": -0.4348062500000001,
        "reward_min": -3.141225,
        "leartime_s": 0.03440773699549027,
        "sampletime": 0.7656694129982498,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 48800,
        "reward_mean": -0.938675,
        "reward_max": -0.1891250000000001,
        "reward_min": -2.0498250000000002,
        "leartime_s": 0.039826049003750086,
        "sampletime": 0.6730190509988461,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 49000,
        "reward_mean": -0.91075,
        "reward_max": 0.12774375000000004,
        "reward_min": -2.0498250000000002,
        "leartime_s": 0.03164219998870976,
        "sampletime": 0.7313781319826376,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 49200,
        "reward_mean": -0.988425,
        "reward_max": 0.052625000000000144,
        "reward_min": -2.3888500000000006,
        "leartime_s": 0.026531003997661173,
        "sampletime": 0.7415906329988502,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 49400,
        "reward_mean": -1.04995,
        "reward_max": 0.07379374999999981,
        "reward_min": -2.2792000000000003,
        "leartime_s": 0.035569664993090555,
        "sampletime": 0.7248197059961967,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 49600,
        "reward_mean": -1.3597,
        "reward_max": -0.5455562499999999,
        "reward_min": -2.6285624999999997,
        "leartime_s": 0.07644917501602322,
        "sampletime": 0.6831057210220024,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 49800,
        "reward_mean": -0.9713249999999999,
        "reward_max": -0.11602499999999986,
        "reward_min": -2.52976875,
        "leartime_s": 0.049919715005671605,
        "sampletime": 0.7743593949999195,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 50000,
        "reward_mean": -1.007875,
        "reward_max": -0.0678625000000001,
        "reward_min": -2.33898125,
        "leartime_s": 0.0585160119808279,
        "sampletime": 0.8077011700079311,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 50200,
        "reward_mean": -1.0200749999999998,
        "reward_max": -0.04615624999999992,
        "reward_min": -2.1754,
        "leartime_s": 0.0686898980056867,
        "sampletime": 0.747606014017947,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 50400,
        "reward_mean": -1.1199,
        "reward_max": -0.013099999999999945,
        "reward_min": -2.51395,
        "leartime_s": 0.053015393001260236,
        "sampletime": 0.7085625089821406,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 50600,
        "reward_mean": -1.124825,
        "reward_max": -0.16240624999999997,
        "reward_min": -2.27206875,
        "leartime_s": 0.03665634500794113,
        "sampletime": 0.798499875003472,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 50800,
        "reward_mean": -1.0178999999999998,
        "reward_max": -0.006962499999999983,
        "reward_min": -1.9659,
        "leartime_s": 0.03186359201208688,
        "sampletime": 0.7885042490088381,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 51000,
        "reward_mean": -0.9963250000000003,
        "reward_max": -0.17101875000000016,
        "reward_min": -2.0846187500000006,
        "leartime_s": 0.02537397199193947,
        "sampletime": 0.8280241070024204,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 51200,
        "reward_mean": -0.9516749999999999,
        "reward_max": -0.11664374999999998,
        "reward_min": -1.9748125,
        "leartime_s": 0.029678608989343047,
        "sampletime": 0.7816903979983181,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 51400,
        "reward_mean": -1.10955,
        "reward_max": -0.1580125000000001,
        "reward_min": -2.4048875,
        "leartime_s": 0.040402255981462076,
        "sampletime": 0.7497712970071007,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 51600,
        "reward_mean": -1.0018500000000001,
        "reward_max": -0.10621250000000018,
        "reward_min": -2.2883187499999993,
        "leartime_s": 0.0260141369944904,
        "sampletime": 0.7313093440025114,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 51800,
        "reward_mean": -0.9933249999999999,
        "reward_max": -0.14535000000000006,
        "reward_min": -1.9277375,
        "leartime_s": 0.03915321599924937,
        "sampletime": 0.7332005359930918,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 52000,
        "reward_mean": -0.9316500000000001,
        "reward_max": -0.08825624999999997,
        "reward_min": -1.9807062500000003,
        "leartime_s": 0.05095321100088768,
        "sampletime": 0.7838185850123409,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 52200,
        "reward_mean": -0.998925,
        "reward_max": 0.013887500000000053,
        "reward_min": -2.38286875,
        "leartime_s": 0.04002823101473041,
        "sampletime": 0.6591222300194204,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 52400,
        "reward_mean": -1.1859749999999998,
        "reward_max": -0.16270624999999986,
        "reward_min": -2.3958312499999996,
        "leartime_s": 0.049195655999938026,
        "sampletime": 0.8620997109974269,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 52600,
        "reward_mean": -0.9777,
        "reward_max": -0.13324999999999998,
        "reward_min": -2.4356999999999998,
        "leartime_s": 0.037765421991935,
        "sampletime": 0.7416445609997027,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 52800,
        "reward_mean": -0.943725,
        "reward_max": 0.09620624999999994,
        "reward_min": -1.8956125,
        "leartime_s": 0.03324851000797935,
        "sampletime": 0.7359881469747052,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 53000,
        "reward_mean": -1.235225,
        "reward_max": -0.2904187500000001,
        "reward_min": -2.6926812499999997,
        "leartime_s": 0.03784199297660962,
        "sampletime": 0.7383289110148326,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 53200,
        "reward_mean": -1.0455999999999999,
        "reward_max": -0.247025,
        "reward_min": -2.0787000000000004,
        "leartime_s": 0.023876094026491046,
        "sampletime": 0.7160144810040947,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 53400,
        "reward_mean": -0.9213499999999999,
        "reward_max": 0.07382500000000011,
        "reward_min": -2.1200375000000005,
        "leartime_s": 0.032920227997237816,
        "sampletime": 0.8083435019943863,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 53600,
        "reward_mean": -1.141625,
        "reward_max": -0.21887499999999988,
        "reward_min": -2.5204062499999997,
        "leartime_s": 0.03894881400628947,
        "sampletime": 0.7318961169803515,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 53800,
        "reward_mean": -1.1526750000000001,
        "reward_max": -0.2890062500000001,
        "reward_min": -2.164662500000001,
        "leartime_s": 0.03094147000228986,
        "sampletime": 0.9007124280033167,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 54000,
        "reward_mean": -1.22325,
        "reward_max": -0.022343749999999954,
        "reward_min": -2.6498875000000006,
        "leartime_s": 0.03472624399000779,
        "sampletime": 0.7328271419974044,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 54200,
        "reward_mean": -1.0349499999999998,
        "reward_max": -0.148725,
        "reward_min": -2.03689375,
        "leartime_s": 0.032601301005342975,
        "sampletime": 0.7943644670012873,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 54400,
        "reward_mean": -0.958075,
        "reward_max": -0.07463125000000001,
        "reward_min": -1.9605812500000004,
        "leartime_s": 0.05029334299615584,
        "sampletime": 0.7461272770015057,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 54600,
        "reward_mean": -1.046525,
        "reward_max": -0.15705624999999995,
        "reward_min": -2.2849124999999995,
        "leartime_s": 0.02867712700390257,
        "sampletime": 0.768502802005969,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 54800,
        "reward_mean": -1.12835,
        "reward_max": -0.28439374999999995,
        "reward_min": -2.222475,
        "leartime_s": 0.0444263219833374,
        "sampletime": 0.7458213449863251,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 55000,
        "reward_mean": -0.84045,
        "reward_max": 0.10414375000000006,
        "reward_min": -2.5223812500000005,
        "leartime_s": 0.017596096004126593,
        "sampletime": 0.7935539770114701,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 55200,
        "reward_mean": -1.0062250000000001,
        "reward_max": 0.0480312499999999,
        "reward_min": -1.996631250000001,
        "leartime_s": 0.050087206007447094,
        "sampletime": 0.6939979330054484,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 55400,
        "reward_mean": -0.9678499999999999,
        "reward_max": -0.14034375000000013,
        "reward_min": -2.0676,
        "leartime_s": 0.026117786997929215,
        "sampletime": 0.7566986950114369,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 55600,
        "reward_mean": -1.089525,
        "reward_max": 0.15805625000000004,
        "reward_min": -2.4014749999999996,
        "leartime_s": 0.04740968000260182,
        "sampletime": 0.6312648250022903,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 55800,
        "reward_mean": -0.9043,
        "reward_max": -0.07372500000000004,
        "reward_min": -2.1324125,
        "leartime_s": 0.034460037015378475,
        "sampletime": 0.7502513699873816,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 56000,
        "reward_mean": -1.0560999999999998,
        "reward_max": -0.25053124999999987,
        "reward_min": -2.0506937499999998,
        "leartime_s": 0.01714058397919871,
        "sampletime": 0.7535289759980515,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 56200,
        "reward_mean": -1.0943999999999998,
        "reward_max": 0.10060000000000002,
        "reward_min": -2.5254499999999998,
        "leartime_s": 0.0162208300025668,
        "sampletime": 0.788460092007881,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 56400,
        "reward_mean": -1.23525,
        "reward_max": -0.3462125,
        "reward_min": -2.1639749999999993,
        "leartime_s": 0.02550012301071547,
        "sampletime": 0.6562415999942459,
        "best_mean": -0.7620750000000001,
        "best_max": 0.1871,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 56600,
        "reward_mean": -0.7573499999999999,
        "reward_max": 0.24115625000000013,
        "reward_min": -2.1238625,
        "leartime_s": 0.03845123198698275,
        "sampletime": 0.7810313100053463,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 56800,
        "reward_mean": -0.9148749999999999,
        "reward_max": 0.0016625000000001118,
        "reward_min": -1.9358374999999994,
        "leartime_s": 0.023669553018407896,
        "sampletime": 0.8757334649853874,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 57000,
        "reward_mean": -1.2675,
        "reward_max": 0.0020749999999998825,
        "reward_min": -2.2482875000000004,
        "leartime_s": 0.023996968026040122,
        "sampletime": 0.7017542849935126,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 57200,
        "reward_mean": -0.9322249999999999,
        "reward_max": -0.1578562500000001,
        "reward_min": -2.857237499999999,
        "leartime_s": 0.03014403601991944,
        "sampletime": 0.7185273290087935,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 57400,
        "reward_mean": -1.241275,
        "reward_max": -0.46236250000000007,
        "reward_min": -2.2138312499999997,
        "leartime_s": 0.04097839101450518,
        "sampletime": 0.7208093639928848,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 57600,
        "reward_mean": -1.179,
        "reward_max": -0.2704625000000002,
        "reward_min": -2.0793562499999996,
        "leartime_s": 0.029913920996477827,
        "sampletime": 0.6908954769896809,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 57800,
        "reward_mean": -0.8942999999999999,
        "reward_max": 0.05711250000000004,
        "reward_min": -1.9840000000000002,
        "leartime_s": 0.035181351006031036,
        "sampletime": 0.7662369160098024,
        "best_mean": -0.7573499999999999,
        "best_max": 0.24115625000000013,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 58000,
        "reward_mean": -0.644,
        "reward_max": 0.3496125,
        "reward_min": -1.7187374999999998,
        "leartime_s": 0.036044387001311406,
        "sampletime": 0.6812433500017505,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 58200,
        "reward_mean": -1.1211499999999999,
        "reward_max": -0.21888750000000007,
        "reward_min": -2.418,
        "leartime_s": 0.028544892003992572,
        "sampletime": 0.7297821209940594,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 58400,
        "reward_mean": -1.44985,
        "reward_max": -0.6026437499999998,
        "reward_min": -2.5703624999999994,
        "leartime_s": 0.03281513199908659,
        "sampletime": 0.8512625020230189,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 58600,
        "reward_mean": -1.0892249999999999,
        "reward_max": -0.17516250000000014,
        "reward_min": -2.625012500000001,
        "leartime_s": 0.029353720979997888,
        "sampletime": 0.7182894930010661,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 58800,
        "reward_mean": -1.0465,
        "reward_max": -0.02899999999999999,
        "reward_min": -2.3085249999999995,
        "leartime_s": 0.07067765999818221,
        "sampletime": 0.6903040990000591,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 59000,
        "reward_mean": -1.1042,
        "reward_max": -0.24068750000000008,
        "reward_min": -2.8741375,
        "leartime_s": 0.03385902298032306,
        "sampletime": 0.6412098490109202,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 59200,
        "reward_mean": -1.0905000000000002,
        "reward_max": -0.29138125000000015,
        "reward_min": -2.288925,
        "leartime_s": 0.03349799197167158,
        "sampletime": 0.710473560000537,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 59400,
        "reward_mean": -1.0495000000000003,
        "reward_max": -0.14150000000000001,
        "reward_min": -1.9764437500000003,
        "leartime_s": 0.04765354099799879,
        "sampletime": 0.7208195620041806,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 59600,
        "reward_mean": -1.07275,
        "reward_max": -0.21556249999999996,
        "reward_min": -2.5244687499999996,
        "leartime_s": 0.031282802985515445,
        "sampletime": 0.7539677339955233,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 59800,
        "reward_mean": -1.2153000000000003,
        "reward_max": -0.2704875,
        "reward_min": -2.258625,
        "leartime_s": 0.06363059999421239,
        "sampletime": 0.6466352010029368,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 60000,
        "reward_mean": -0.8126500000000001,
        "reward_max": 0.04644374999999985,
        "reward_min": -1.9634125000000004,
        "leartime_s": 0.02866741397883743,
        "sampletime": 0.7975172759906854,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 60200,
        "reward_mean": -1.0818,
        "reward_max": -0.27544375,
        "reward_min": -2.0294437499999995,
        "leartime_s": 0.027371084986953065,
        "sampletime": 0.758804737997707,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 60400,
        "reward_mean": -1.3135,
        "reward_max": -0.27181875,
        "reward_min": -2.4033625,
        "leartime_s": 0.04113157800748013,
        "sampletime": 0.6581140650087036,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 60600,
        "reward_mean": -1.33405,
        "reward_max": -0.3819937500000001,
        "reward_min": -3.0496624999999993,
        "leartime_s": 0.02658190400688909,
        "sampletime": 0.7879875660000835,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 60800,
        "reward_mean": -1.09885,
        "reward_max": -0.3654125000000001,
        "reward_min": -1.9430749999999997,
        "leartime_s": 0.05831931499415077,
        "sampletime": 0.6740026549960021,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 61000,
        "reward_mean": -1.067975,
        "reward_max": -0.10325625000000004,
        "reward_min": -2.043,
        "leartime_s": 0.03890949898050167,
        "sampletime": 0.7126501870225184,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 61200,
        "reward_mean": -0.9660749999999999,
        "reward_max": 0.03803749999999993,
        "reward_min": -1.90385625,
        "leartime_s": 0.0379839829984121,
        "sampletime": 0.77285253800801,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 61400,
        "reward_mean": -1.102375,
        "reward_max": -0.24816250000000012,
        "reward_min": -2.27999375,
        "leartime_s": 0.031920622976031154,
        "sampletime": 0.808075895998627,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 61600,
        "reward_mean": -1.25325,
        "reward_max": -0.38351250000000003,
        "reward_min": -2.45096875,
        "leartime_s": 0.044401521008694544,
        "sampletime": 0.7643761379877105,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 61800,
        "reward_mean": -1.1465750000000001,
        "reward_max": -0.06536249999999995,
        "reward_min": -2.1174250000000003,
        "leartime_s": 0.03359448199626058,
        "sampletime": 0.7222051040153019,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 62000,
        "reward_mean": -0.938975,
        "reward_max": -0.06723124999999971,
        "reward_min": -2.07805625,
        "leartime_s": 0.03326533199287951,
        "sampletime": 0.6851632249890827,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 62200,
        "reward_mean": -0.8881999999999998,
        "reward_max": 0.09078125,
        "reward_min": -2.3001624999999994,
        "leartime_s": 0.050460737984394655,
        "sampletime": 0.7668833770148922,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 62400,
        "reward_mean": -1.0636750000000001,
        "reward_max": -0.184925,
        "reward_min": -2.437943750000001,
        "leartime_s": 0.022217584017198533,
        "sampletime": 0.640442547010025,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 62600,
        "reward_mean": -1.2717250000000004,
        "reward_max": -0.47821250000000004,
        "reward_min": -2.3401062500000003,
        "leartime_s": 0.023261019989149645,
        "sampletime": 0.7798912459984422,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 62800,
        "reward_mean": -1.0089999999999997,
        "reward_max": -0.17443125000000004,
        "reward_min": -2.0036187500000007,
        "leartime_s": 0.04755565102095716,
        "sampletime": 0.8645731860015076,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 63000,
        "reward_mean": -1.2208500000000002,
        "reward_max": -0.35131249999999997,
        "reward_min": -2.1169312500000004,
        "leartime_s": 0.03378004499245435,
        "sampletime": 0.7227965009806212,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 63200,
        "reward_mean": -0.9818499999999999,
        "reward_max": -0.07156250000000008,
        "reward_min": -2.3789,
        "leartime_s": 0.04334210301749408,
        "sampletime": 0.7803918110148516,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 63400,
        "reward_mean": -1.1104250000000002,
        "reward_max": -0.3090875,
        "reward_min": -2.4608874999999997,
        "leartime_s": 0.03775832199607976,
        "sampletime": 0.7888593150128145,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 63600,
        "reward_mean": -1.1337000000000004,
        "reward_max": -0.14579999999999996,
        "reward_min": -2.6736375,
        "leartime_s": 0.025747147999936715,
        "sampletime": 0.8284694070171099,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 63800,
        "reward_mean": -1.14305,
        "reward_max": 0.04913749999999997,
        "reward_min": -2.39579375,
        "leartime_s": 0.05236380998394452,
        "sampletime": 0.729666047001956,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 64000,
        "reward_mean": -1.44885,
        "reward_max": -0.43450625000000004,
        "reward_min": -2.8628312500000015,
        "leartime_s": 0.03825208300258964,
        "sampletime": 0.6542718529817648,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 64200,
        "reward_mean": -1.289075,
        "reward_max": -0.38083750000000016,
        "reward_min": -2.6156125,
        "leartime_s": 0.04987796401837841,
        "sampletime": 0.7761270820046775,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 64400,
        "reward_mean": -1.006625,
        "reward_max": 0.03180624999999991,
        "reward_min": -2.2793687499999997,
        "leartime_s": 0.02386761800153181,
        "sampletime": 0.619619542005239,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 64600,
        "reward_mean": -1.2349,
        "reward_max": -0.1354312499999999,
        "reward_min": -2.5102687500000003,
        "leartime_s": 0.05510157599928789,
        "sampletime": 0.7464131930028088,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 64800,
        "reward_mean": -0.931875,
        "reward_max": -0.09903750000000011,
        "reward_min": -2.0350624999999996,
        "leartime_s": 0.04789616298512556,
        "sampletime": 0.7582499329873826,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 65000,
        "reward_mean": -1.2795500000000002,
        "reward_max": -0.4472500000000001,
        "reward_min": -2.4570875,
        "leartime_s": 0.05678715699468739,
        "sampletime": 0.6934623749984894,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 65200,
        "reward_mean": -1.0192750000000002,
        "reward_max": -0.3224437500000001,
        "reward_min": -1.9519375,
        "leartime_s": 0.05940122698666528,
        "sampletime": 0.67498716400587,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 65400,
        "reward_mean": -0.942725,
        "reward_max": 0.020393750000000155,
        "reward_min": -2.1864812500000004,
        "leartime_s": 0.056009791005635634,
        "sampletime": 0.800424296001438,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 65600,
        "reward_mean": -1.0615749999999997,
        "reward_max": -0.19355624999999996,
        "reward_min": -2.32370625,
        "leartime_s": 0.028512463002698496,
        "sampletime": 0.8212749260128476,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 65800,
        "reward_mean": -1.1051,
        "reward_max": -0.13825000000000018,
        "reward_min": -2.38456875,
        "leartime_s": 0.031164337997324765,
        "sampletime": 0.7021807470009662,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 66000,
        "reward_mean": -1.19335,
        "reward_max": -0.34277499999999983,
        "reward_min": -2.46338125,
        "leartime_s": 0.051839286024915054,
        "sampletime": 0.713671664998401,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 66200,
        "reward_mean": -1.0450749999999998,
        "reward_max": -0.14549374999999998,
        "reward_min": -2.0905062500000002,
        "leartime_s": 0.06761561200255528,
        "sampletime": 0.6615823479951359,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 66400,
        "reward_mean": -0.99665,
        "reward_max": -0.016087499999999987,
        "reward_min": -1.9582437500000005,
        "leartime_s": 0.028478035994339734,
        "sampletime": 0.7000224310031626,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 66600,
        "reward_mean": -1.1719750000000002,
        "reward_max": 0.008131249999999896,
        "reward_min": -2.3542687500000006,
        "leartime_s": 0.033357432985212654,
        "sampletime": 0.7723744379763957,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 66800,
        "reward_mean": -1.113075,
        "reward_max": -0.07495625000000003,
        "reward_min": -2.08653125,
        "leartime_s": 0.0487341080151964,
        "sampletime": 0.7353844229946844,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 67000,
        "reward_mean": -1.1083000000000003,
        "reward_max": -0.19451875000000007,
        "reward_min": -2.13588125,
        "leartime_s": 0.04465344498748891,
        "sampletime": 0.6445558429986704,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 67200,
        "reward_mean": -1.18785,
        "reward_max": -0.3348437500000001,
        "reward_min": -2.2182437499999996,
        "leartime_s": 0.0472272610059008,
        "sampletime": 0.8286853320023511,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 67400,
        "reward_mean": -1.264575,
        "reward_max": -0.13545625000000006,
        "reward_min": -2.63916875,
        "leartime_s": 0.03434972101240419,
        "sampletime": 0.8195034199743532,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 67600,
        "reward_mean": -1.02865,
        "reward_max": -0.19248749999999992,
        "reward_min": -1.9989687500000006,
        "leartime_s": 0.07262086600530893,
        "sampletime": 0.7384527740068734,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 67800,
        "reward_mean": -1.1632750000000003,
        "reward_max": -0.24699375000000012,
        "reward_min": -2.4396625000000007,
        "leartime_s": 0.05182448701816611,
        "sampletime": 0.6602461840084288,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 68000,
        "reward_mean": -1.4273249999999997,
        "reward_max": -0.6259187500000001,
        "reward_min": -2.36334375,
        "leartime_s": 0.059083912026835606,
        "sampletime": 0.6804616080189589,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 68200,
        "reward_mean": -0.7824749999999999,
        "reward_max": 0.3391437500000001,
        "reward_min": -1.9766124999999997,
        "leartime_s": 0.051995860994793475,
        "sampletime": 0.7193141349998768,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 68400,
        "reward_mean": -0.869325,
        "reward_max": 0.16315000000000007,
        "reward_min": -2.153475,
        "leartime_s": 0.07293424801900983,
        "sampletime": 0.72085395801696,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 68600,
        "reward_mean": -0.919225,
        "reward_max": -0.03821249999999998,
        "reward_min": -2.2220312499999997,
        "leartime_s": 0.055057329998817295,
        "sampletime": 0.7095350800082088,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 68800,
        "reward_mean": -0.9386,
        "reward_max": 0.004912500000000066,
        "reward_min": -1.9964375000000003,
        "leartime_s": 0.07144105798215605,
        "sampletime": 0.6936284200055525,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 69000,
        "reward_mean": -1.1247249999999998,
        "reward_max": -0.35838749999999975,
        "reward_min": -2.48320625,
        "leartime_s": 0.04357740900013596,
        "sampletime": 0.7491498849994969,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 69200,
        "reward_mean": -1.262775,
        "reward_max": -0.53970625,
        "reward_min": -2.3596062500000006,
        "leartime_s": 0.026367682992713526,
        "sampletime": 0.7406534510082565,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 69400,
        "reward_mean": -0.99525,
        "reward_max": -0.12970625000000002,
        "reward_min": -2.0621937499999996,
        "leartime_s": 0.05986700498033315,
        "sampletime": 0.661697292001918,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 69600,
        "reward_mean": -1.1087999999999998,
        "reward_max": -0.26004999999999995,
        "reward_min": -2.25121875,
        "leartime_s": 0.02320298898848705,
        "sampletime": 0.7721157199994195,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 69800,
        "reward_mean": -1.2948000000000002,
        "reward_max": -0.17853750000000013,
        "reward_min": -2.2498375,
        "leartime_s": 0.04533713700948283,
        "sampletime": 0.6259221179934684,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 70000,
        "reward_mean": -0.9224249999999999,
        "reward_max": 0.07992500000000011,
        "reward_min": -1.9949562500000002,
        "leartime_s": 0.05216609299532138,
        "sampletime": 0.7228051139973104,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 70200,
        "reward_mean": -0.9492999999999999,
        "reward_max": -0.20648125,
        "reward_min": -2.0157249999999998,
        "leartime_s": 0.025155114999506623,
        "sampletime": 0.7123145709920209,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 70400,
        "reward_mean": -1.320275,
        "reward_max": -0.34770625000000005,
        "reward_min": -2.6366625,
        "leartime_s": 0.03748857000027783,
        "sampletime": 0.6650205319747329,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 70600,
        "reward_mean": -0.9923999999999998,
        "reward_max": -0.024624999999999855,
        "reward_min": -2.22341875,
        "leartime_s": 0.04075163198285736,
        "sampletime": 0.6479742570081726,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 70800,
        "reward_mean": -0.86515,
        "reward_max": 0.18091249999999998,
        "reward_min": -1.95855,
        "leartime_s": 0.02923767000902444,
        "sampletime": 0.6418768799921963,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 71000,
        "reward_mean": -1.017625,
        "reward_max": -0.24603125000000006,
        "reward_min": -2.3652624999999996,
        "leartime_s": 0.018883226002799347,
        "sampletime": 0.9172505860042293,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 71200,
        "reward_mean": -1.1041249999999998,
        "reward_max": -0.0689249999999999,
        "reward_min": -2.5531875,
        "leartime_s": 0.029350081022130325,
        "sampletime": 0.7036701499891933,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 71400,
        "reward_mean": -1.103975,
        "reward_max": -0.07959375000000002,
        "reward_min": -2.2365375,
        "leartime_s": 0.021218731009867042,
        "sampletime": 0.6744149220176041,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 71600,
        "reward_mean": -1.109475,
        "reward_max": -0.11824999999999994,
        "reward_min": -2.3195437500000002,
        "leartime_s": 0.03437109201331623,
        "sampletime": 0.6636919479933567,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 71800,
        "reward_mean": -0.8993499999999999,
        "reward_max": -0.026799999999999942,
        "reward_min": -1.9018687499999998,
        "leartime_s": 0.04900972201721743,
        "sampletime": 0.7415893469878938,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 72000,
        "reward_mean": -1.0912,
        "reward_max": 0.028993750000000124,
        "reward_min": -2.3126125,
        "leartime_s": 0.05547173001104966,
        "sampletime": 0.7463940379966516,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 72200,
        "reward_mean": -1.02315,
        "reward_max": 0.15729375000000023,
        "reward_min": -2.0197250000000007,
        "leartime_s": 0.036837588995695114,
        "sampletime": 0.745161499013193,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 72400,
        "reward_mean": -1.0927500000000003,
        "reward_max": 0.01575625,
        "reward_min": -2.44218125,
        "leartime_s": 0.04722676199162379,
        "sampletime": 0.6731224959949031,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 72600,
        "reward_mean": -1.09625,
        "reward_max": -0.05997499999999986,
        "reward_min": -2.08286875,
        "leartime_s": 0.021945576008874923,
        "sampletime": 0.8066453909850679,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 72800,
        "reward_mean": -0.8895250000000001,
        "reward_max": -0.002906250000000103,
        "reward_min": -2.10465625,
        "leartime_s": 0.037479730002814904,
        "sampletime": 0.8208882010076195,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 73000,
        "reward_mean": -1.0611,
        "reward_max": -0.18121249999999986,
        "reward_min": -2.4248937500000007,
        "leartime_s": 0.03599803100223653,
        "sampletime": 0.7789244439918548,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 73200,
        "reward_mean": -1.427275,
        "reward_max": -0.21848125000000007,
        "reward_min": -2.807725,
        "leartime_s": 0.03229757898952812,
        "sampletime": 0.6672395739878993,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 73400,
        "reward_mean": -0.9362249999999999,
        "reward_max": 0.11813750000000012,
        "reward_min": -2.24775,
        "leartime_s": 0.043058666022261605,
        "sampletime": 0.7506370560149662,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 73600,
        "reward_mean": -0.7921749999999999,
        "reward_max": 0.0782187500000001,
        "reward_min": -1.8505187499999998,
        "leartime_s": 0.03853400898515247,
        "sampletime": 0.7001362180162687,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 73800,
        "reward_mean": -0.8757749999999999,
        "reward_max": 0.07226250000000012,
        "reward_min": -2.18325,
        "leartime_s": 0.0438706630084198,
        "sampletime": 0.8498589600203559,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 74000,
        "reward_mean": -0.9031750000000001,
        "reward_max": -0.1336749999999998,
        "reward_min": -2.3009062500000006,
        "leartime_s": 0.072289288014872,
        "sampletime": 0.9580879479763098,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 74200,
        "reward_mean": -1.0319999999999996,
        "reward_max": -0.13188125000000003,
        "reward_min": -2.390462500000001,
        "leartime_s": 0.0625721669930499,
        "sampletime": 0.604876013007015,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 74400,
        "reward_mean": -0.8256749999999999,
        "reward_max": 0.1548000000000001,
        "reward_min": -1.8606125000000002,
        "leartime_s": 0.025537858018651605,
        "sampletime": 0.8170710720005445,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 74600,
        "reward_mean": -1.1342999999999996,
        "reward_max": 0.11359375000000013,
        "reward_min": -2.1618187499999992,
        "leartime_s": 0.04394535400206223,
        "sampletime": 0.7229499710083473,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 74800,
        "reward_mean": -0.67775,
        "reward_max": 0.20739375000000013,
        "reward_min": -1.9516312499999995,
        "leartime_s": 0.049566406989470124,
        "sampletime": 0.7003696729952935,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 75000,
        "reward_mean": -1.033725,
        "reward_max": -0.16444375,
        "reward_min": -2.2172999999999994,
        "leartime_s": 0.04929436300881207,
        "sampletime": 0.721626267011743,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 75200,
        "reward_mean": -1.0137749999999999,
        "reward_max": -0.09631875000000009,
        "reward_min": -2.43101875,
        "leartime_s": 0.027648340008454397,
        "sampletime": 0.7221042710007168,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 75400,
        "reward_mean": -1.000975,
        "reward_max": 0.02058750000000001,
        "reward_min": -2.0932875,
        "leartime_s": 0.05573373200604692,
        "sampletime": 0.7792286440089811,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 75600,
        "reward_mean": -0.8817750000000001,
        "reward_max": 0.06979374999999999,
        "reward_min": -2.189881250000001,
        "leartime_s": 0.06748460899689235,
        "sampletime": 0.7411139260220807,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 75800,
        "reward_mean": -0.8356000000000001,
        "reward_max": 0.18213749999999984,
        "reward_min": -2.0013562499999997,
        "leartime_s": 0.04007028599153273,
        "sampletime": 0.7297332719899714,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 76000,
        "reward_mean": -0.7741249999999998,
        "reward_max": 0.36570625,
        "reward_min": -2.2811249999999994,
        "leartime_s": 0.06521590199554339,
        "sampletime": 0.740754778002156,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 76200,
        "reward_mean": -0.8098000000000001,
        "reward_max": 0.09590000000000003,
        "reward_min": -2.08274375,
        "leartime_s": 0.041846060019452125,
        "sampletime": 0.7183232179959305,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 76400,
        "reward_mean": -1.0235499999999997,
        "reward_max": 0.05995625000000004,
        "reward_min": -2.4342562500000002,
        "leartime_s": 0.04358343899366446,
        "sampletime": 0.7381492519925814,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 76600,
        "reward_mean": -1.0035749999999999,
        "reward_max": 0.04650625000000008,
        "reward_min": -2.33389375,
        "leartime_s": 0.05751451800460927,
        "sampletime": 0.7032424859935418,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 76800,
        "reward_mean": -0.6755749999999998,
        "reward_max": 0.5654812500000002,
        "reward_min": -2.0695250000000005,
        "leartime_s": 0.02892157799215056,
        "sampletime": 0.9282469430181663,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 77000,
        "reward_mean": -0.7128,
        "reward_max": 0.4791937500000001,
        "reward_min": -1.9098,
        "leartime_s": 0.07767463001073338,
        "sampletime": 0.7003579510201234,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 77200,
        "reward_mean": -0.98595,
        "reward_max": -0.13774999999999996,
        "reward_min": -2.2922250000000006,
        "leartime_s": 0.044412475981516764,
        "sampletime": 0.7601310300233308,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 77400,
        "reward_mean": -1.1262000000000003,
        "reward_max": 0.03838125000000003,
        "reward_min": -2.3691562499999996,
        "leartime_s": 0.060445982991950586,
        "sampletime": 0.7850755380059127,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 77600,
        "reward_mean": -1.1457500000000003,
        "reward_max": -0.26023125,
        "reward_min": -2.5006812500000004,
        "leartime_s": 0.03028276699478738,
        "sampletime": 0.6656529619940557,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 77800,
        "reward_mean": -0.8359500000000001,
        "reward_max": 0.1718375000000001,
        "reward_min": -1.9959875000000005,
        "leartime_s": 0.05458211500081234,
        "sampletime": 0.6832291290047579,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 78000,
        "reward_mean": -0.8592,
        "reward_max": 0.30990000000000006,
        "reward_min": -2.1440125000000005,
        "leartime_s": 0.03838056599488482,
        "sampletime": 0.690528727020137,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 78200,
        "reward_mean": -0.6585,
        "reward_max": 0.2219375,
        "reward_min": -1.7113125,
        "leartime_s": 0.07995851401938125,
        "sampletime": 0.7280902170168702,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 78400,
        "reward_mean": -0.8831000000000001,
        "reward_max": 0.11133750000000006,
        "reward_min": -2.4460749999999996,
        "leartime_s": 0.06699103600112721,
        "sampletime": 0.7075501889921725,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 78600,
        "reward_mean": -0.8494250000000002,
        "reward_max": 0.06960000000000002,
        "reward_min": -2.07416875,
        "leartime_s": 0.04932691599242389,
        "sampletime": 0.8102504280104768,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 78800,
        "reward_mean": -0.9148,
        "reward_max": -0.15311874999999972,
        "reward_min": -2.289,
        "leartime_s": 0.08084784098900855,
        "sampletime": 0.6673164809762966,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 79000,
        "reward_mean": -0.9067750000000001,
        "reward_max": 0.06831250000000005,
        "reward_min": -2.336125,
        "leartime_s": 0.06449744201381691,
        "sampletime": 0.7257253919960931,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 79200,
        "reward_mean": -0.838375,
        "reward_max": 0.09894375000000002,
        "reward_min": -2.1680812499999997,
        "leartime_s": 0.08333600999321789,
        "sampletime": 0.7506782669806853,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 79400,
        "reward_mean": -0.986125,
        "reward_max": 0.004037500000000124,
        "reward_min": -1.9836437500000001,
        "leartime_s": 0.07684591901488602,
        "sampletime": 0.764450914983172,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 79600,
        "reward_mean": -0.8310750000000001,
        "reward_max": 0.36226249999999993,
        "reward_min": -1.9239250000000006,
        "leartime_s": 0.03871586199966259,
        "sampletime": 0.8850078020186629,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 79800,
        "reward_mean": -0.7395499999999999,
        "reward_max": 0.2942750000000002,
        "reward_min": -1.8889562500000006,
        "leartime_s": 0.06494896500953473,
        "sampletime": 0.7717341220122762,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 80000,
        "reward_mean": -0.7626750000000001,
        "reward_max": 0.2163062499999999,
        "reward_min": -2.484212500000001,
        "leartime_s": 0.05721657400135882,
        "sampletime": 0.7353120880143251,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 80200,
        "reward_mean": -0.80945,
        "reward_max": 0.002012499999999945,
        "reward_min": -1.8268000000000004,
        "leartime_s": 0.044678717997157946,
        "sampletime": 0.7697916860051919,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 80400,
        "reward_mean": -0.8914500000000001,
        "reward_max": 0.03042500000000002,
        "reward_min": -2.2813312499999996,
        "leartime_s": 0.044005590985761955,
        "sampletime": 0.7417593699938152,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 80600,
        "reward_mean": -0.68365,
        "reward_max": 0.3599874999999999,
        "reward_min": -1.7554499999999993,
        "leartime_s": 0.022539308993145823,
        "sampletime": 0.6906139019993134,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 80800,
        "reward_mean": -0.6929000000000001,
        "reward_max": 0.45969999999999994,
        "reward_min": -1.7324625000000002,
        "leartime_s": 0.04097716600517742,
        "sampletime": 0.640126512007555,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 81000,
        "reward_mean": -0.7243249999999999,
        "reward_max": 0.060418750000000056,
        "reward_min": -1.68705625,
        "leartime_s": 0.059228406025795266,
        "sampletime": 0.7083108049992006,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 81200,
        "reward_mean": -0.741375,
        "reward_max": 0.32476874999999994,
        "reward_min": -2.2303187499999995,
        "leartime_s": 0.0752375969896093,
        "sampletime": 0.7792719040007796,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 81400,
        "reward_mean": -0.7049749999999999,
        "reward_max": 0.18631250000000008,
        "reward_min": -1.9385625000000002,
        "leartime_s": 0.03017718900809996,
        "sampletime": 0.7276479130086955,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 81600,
        "reward_mean": -0.9196749999999999,
        "reward_max": 0.035318749999999954,
        "reward_min": -2.6921874999999993,
        "leartime_s": 0.05378569400636479,
        "sampletime": 0.6835269049915951,
        "best_mean": -0.644,
        "best_max": 0.3496125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 81800,
        "reward_mean": -0.5654000000000001,
        "reward_max": 0.5682249999999999,
        "reward_min": -2.061806250000001,
        "leartime_s": 0.05096675601089373,
        "sampletime": 0.7133737569965888,
        "best_mean": -0.5654000000000001,
        "best_max": 0.5682249999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 82000,
        "reward_mean": -0.6023499999999999,
        "reward_max": 0.46546250000000006,
        "reward_min": -2.0320687499999996,
        "leartime_s": 0.030953192006563768,
        "sampletime": 0.794525772013003,
        "best_mean": -0.5654000000000001,
        "best_max": 0.5682249999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 82200,
        "reward_mean": -0.8433749999999999,
        "reward_max": 0.19796249999999999,
        "reward_min": -1.9969687499999997,
        "leartime_s": 0.029007281991653144,
        "sampletime": 0.6959275700210128,
        "best_mean": -0.5654000000000001,
        "best_max": 0.5682249999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 82400,
        "reward_mean": -0.812125,
        "reward_max": 0.24140624999999993,
        "reward_min": -2.036025,
        "leartime_s": 0.07725446100812405,
        "sampletime": 0.8123711160151288,
        "best_mean": -0.5654000000000001,
        "best_max": 0.5682249999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 82600,
        "reward_mean": -0.5005999999999999,
        "reward_max": 0.38478749999999995,
        "reward_min": -1.7782374999999997,
        "leartime_s": 0.051617368997540325,
        "sampletime": 0.6583141910086852,
        "best_mean": -0.5005999999999999,
        "best_max": 0.38478749999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 82800,
        "reward_mean": -0.39657500000000007,
        "reward_max": 0.4538874999999999,
        "reward_min": -1.2920500000000001,
        "leartime_s": 0.04223627099418081,
        "sampletime": 0.7005360820039641,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 83000,
        "reward_mean": -0.5342749999999998,
        "reward_max": 0.3055875000000003,
        "reward_min": -1.7655250000000002,
        "leartime_s": 0.0811498939874582,
        "sampletime": 0.804793271003291,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 83200,
        "reward_mean": -0.6467999999999999,
        "reward_max": 0.22813750000000016,
        "reward_min": -1.6650187500000004,
        "leartime_s": 0.047556594014167786,
        "sampletime": 0.7020196540106554,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 83400,
        "reward_mean": -0.6715749999999999,
        "reward_max": 0.05848125000000017,
        "reward_min": -1.6320437500000002,
        "leartime_s": 0.033374216000083834,
        "sampletime": 0.7575071199971717,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 83600,
        "reward_mean": -0.6310500000000002,
        "reward_max": 0.37629374999999987,
        "reward_min": -1.7448937499999997,
        "leartime_s": 0.05396624299464747,
        "sampletime": 0.7712616860226262,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 83800,
        "reward_mean": -0.7674500000000001,
        "reward_max": 0.07604999999999992,
        "reward_min": -1.6806875,
        "leartime_s": 0.06835289401351474,
        "sampletime": 0.6871596119890455,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 84000,
        "reward_mean": -0.51945,
        "reward_max": 0.38691875000000014,
        "reward_min": -1.5529124999999995,
        "leartime_s": 0.03189627800020389,
        "sampletime": 0.6520335939712822,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 84200,
        "reward_mean": -0.9191500000000001,
        "reward_max": 0.22934999999999986,
        "reward_min": -2.1492375000000004,
        "leartime_s": 0.058150772005319595,
        "sampletime": 0.7334873100044206,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 84400,
        "reward_mean": -0.9545249999999998,
        "reward_max": 0.03115000000000004,
        "reward_min": -2.0862937499999994,
        "leartime_s": 0.05505293401074596,
        "sampletime": 0.8034888760012109,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 84600,
        "reward_mean": -0.4241249999999999,
        "reward_max": 0.41662499999999986,
        "reward_min": -1.4550312499999998,
        "leartime_s": 0.07989871897734702,
        "sampletime": 0.6472962159896269,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 84800,
        "reward_mean": -0.6323,
        "reward_max": 0.37573750000000006,
        "reward_min": -1.8917312500000003,
        "leartime_s": 0.04094783400068991,
        "sampletime": 0.6437445759947877,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 85000,
        "reward_mean": -0.9119750000000001,
        "reward_max": 0.07106874999999989,
        "reward_min": -1.9972500000000002,
        "leartime_s": 0.07490378600778058,
        "sampletime": 0.6553615470184013,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 85200,
        "reward_mean": -0.748175,
        "reward_max": 0.3289562500000002,
        "reward_min": -1.9529875,
        "leartime_s": 0.025884900998789817,
        "sampletime": 0.8479315070144366,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 85400,
        "reward_mean": -0.8287,
        "reward_max": 0.06236249999999999,
        "reward_min": -1.9050937499999996,
        "leartime_s": 0.06245428801048547,
        "sampletime": 0.7788035180128645,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 85600,
        "reward_mean": -0.8667749999999999,
        "reward_max": 0.22043749999999995,
        "reward_min": -2.1065875000000003,
        "leartime_s": 0.03100691200233996,
        "sampletime": 0.7746533349854872,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 85800,
        "reward_mean": -0.8871749999999999,
        "reward_max": 0.12224999999999994,
        "reward_min": -2.1358875,
        "leartime_s": 0.06405803601955995,
        "sampletime": 0.7112398680183105,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 86000,
        "reward_mean": -0.8165249999999998,
        "reward_max": -0.020793750000000243,
        "reward_min": -2.0100874999999996,
        "leartime_s": 0.03825988800963387,
        "sampletime": 0.7933791010000277,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 86200,
        "reward_mean": -1.0669250000000001,
        "reward_max": -0.09938750000000017,
        "reward_min": -2.1793875,
        "leartime_s": 0.02873362900572829,
        "sampletime": 0.7463828280160669,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 86400,
        "reward_mean": -0.5917749999999998,
        "reward_max": 0.33189375000000026,
        "reward_min": -1.6035249999999994,
        "leartime_s": 0.07351867799297906,
        "sampletime": 0.7404746020038147,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 86600,
        "reward_mean": -0.8757749999999999,
        "reward_max": 0.11710000000000001,
        "reward_min": -2.1979687499999994,
        "leartime_s": 0.07431514299241826,
        "sampletime": 0.7913186509977095,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 86800,
        "reward_mean": -0.9169499999999999,
        "reward_max": 0.26222500000000004,
        "reward_min": -1.9685749999999997,
        "leartime_s": 0.04040636200807057,
        "sampletime": 0.6479907169996295,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 87000,
        "reward_mean": -1.0327999999999997,
        "reward_max": 0.0022125000000001865,
        "reward_min": -2.188425,
        "leartime_s": 0.041806630993960425,
        "sampletime": 0.8456573779985774,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 87200,
        "reward_mean": -0.9128749999999998,
        "reward_max": 0.47723125000000016,
        "reward_min": -2.04343125,
        "leartime_s": 0.04743459599558264,
        "sampletime": 0.7369712340005208,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 87400,
        "reward_mean": -0.9781749999999999,
        "reward_max": -0.04006249999999984,
        "reward_min": -2.0366125000000004,
        "leartime_s": 0.044069644005503505,
        "sampletime": 0.7497477040160447,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 87600,
        "reward_mean": -0.933125,
        "reward_max": -0.00819375,
        "reward_min": -2.242425,
        "leartime_s": 0.0732022849842906,
        "sampletime": 0.6591918109916151,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 87800,
        "reward_mean": -0.5200249999999998,
        "reward_max": 0.4710187500000002,
        "reward_min": -1.5111875000000001,
        "leartime_s": 0.058765534980921075,
        "sampletime": 0.7816750740166754,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 88000,
        "reward_mean": -0.821925,
        "reward_max": 0.13282500000000003,
        "reward_min": -2.23685,
        "leartime_s": 0.04644038001424633,
        "sampletime": 0.9352349719847552,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 88200,
        "reward_mean": -0.808275,
        "reward_max": 0.07521875000000011,
        "reward_min": -1.8210812500000002,
        "leartime_s": 0.0789931130129844,
        "sampletime": 0.7261183179798536,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 88400,
        "reward_mean": -1.023225,
        "reward_max": 0.0006999999999999784,
        "reward_min": -2.3100937499999996,
        "leartime_s": 0.026105634024133906,
        "sampletime": 0.6939317579963244,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 88600,
        "reward_mean": -1.025375,
        "reward_max": -0.11518124999999979,
        "reward_min": -2.2417562500000003,
        "leartime_s": 0.07115664400043897,
        "sampletime": 0.839195654989453,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 88800,
        "reward_mean": -1.1203999999999998,
        "reward_max": -0.03640625000000007,
        "reward_min": -2.20740625,
        "leartime_s": 0.07346172901452519,
        "sampletime": 0.7177778090117499,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 89000,
        "reward_mean": -1.1725,
        "reward_max": -0.2563874999999999,
        "reward_min": -2.2775250000000002,
        "leartime_s": 0.02282490298966877,
        "sampletime": 0.690395976009313,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 89200,
        "reward_mean": -0.9015749999999999,
        "reward_max": 0.25345000000000006,
        "reward_min": -2.2111812500000005,
        "leartime_s": 0.030439402005868033,
        "sampletime": 0.718300762004219,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 89400,
        "reward_mean": -0.9318999999999998,
        "reward_max": 0.007350000000000245,
        "reward_min": -1.9836624999999997,
        "leartime_s": 0.07745771302143112,
        "sampletime": 0.6849052259931341,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 89600,
        "reward_mean": -0.8598249999999998,
        "reward_max": -0.0851749999999999,
        "reward_min": -2.1437,
        "leartime_s": 0.025638620980316773,
        "sampletime": 0.7398744689999148,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 89800,
        "reward_mean": -0.6090749999999998,
        "reward_max": 0.19584375000000012,
        "reward_min": -1.8759937499999995,
        "leartime_s": 0.03054420099942945,
        "sampletime": 0.8990509120048955,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 90000,
        "reward_mean": -1.0405250000000001,
        "reward_max": 0.0631249999999999,
        "reward_min": -2.616412499999999,
        "leartime_s": 0.06561363901710138,
        "sampletime": 0.6873551059979945,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 90200,
        "reward_mean": -0.8904249999999999,
        "reward_max": 0.09336249999999992,
        "reward_min": -2.25295,
        "leartime_s": 0.02752139000222087,
        "sampletime": 0.7213113459874876,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 90400,
        "reward_mean": -0.9753000000000001,
        "reward_max": 0.00764375000000006,
        "reward_min": -1.9978187499999995,
        "leartime_s": 0.03800169797614217,
        "sampletime": 0.7363809900125489,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 90600,
        "reward_mean": -0.9922250000000001,
        "reward_max": 0.021493749999999867,
        "reward_min": -2.3667187500000004,
        "leartime_s": 0.023815477994503453,
        "sampletime": 0.7890979190124199,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 90800,
        "reward_mean": -1.008875,
        "reward_max": -0.06816250000000007,
        "reward_min": -1.9481999999999997,
        "leartime_s": 0.1028117630048655,
        "sampletime": 1.1190139329992235,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 91000,
        "reward_mean": -0.9977999999999999,
        "reward_max": 0.07783125000000005,
        "reward_min": -2.5387375000000003,
        "leartime_s": 0.041960631002439186,
        "sampletime": 0.6726413239957765,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 91200,
        "reward_mean": -0.9624749999999999,
        "reward_max": -0.09503124999999997,
        "reward_min": -2.3501000000000003,
        "leartime_s": 0.02983421800308861,
        "sampletime": 0.6472630460048094,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 91400,
        "reward_mean": -1.223575,
        "reward_max": -0.35516250000000016,
        "reward_min": -2.3174437500000002,
        "leartime_s": 0.06502435498987325,
        "sampletime": 0.709572035993915,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 91600,
        "reward_mean": -1.2166750000000002,
        "reward_max": -0.08056250000000009,
        "reward_min": -2.26233125,
        "leartime_s": 0.036718568997457623,
        "sampletime": 0.82918935501948,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 91800,
        "reward_mean": -1.2902500000000001,
        "reward_max": -0.2787437500000002,
        "reward_min": -2.7010874999999994,
        "leartime_s": 0.07142611799645238,
        "sampletime": 0.7536302910011727,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 92000,
        "reward_mean": -1.1087999999999998,
        "reward_max": -0.0392125000000001,
        "reward_min": -2.2736000000000005,
        "leartime_s": 0.05087007800466381,
        "sampletime": 0.9341761640098412,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 92200,
        "reward_mean": -0.994625,
        "reward_max": -0.07742499999999991,
        "reward_min": -2.2775187500000005,
        "leartime_s": 0.04072839400032535,
        "sampletime": 0.7945879890176002,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 92400,
        "reward_mean": -1.041375,
        "reward_max": -0.19784999999999994,
        "reward_min": -2.5171187499999994,
        "leartime_s": 0.030955344991525635,
        "sampletime": 0.7129603200010024,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 92600,
        "reward_mean": -1.1144749999999999,
        "reward_max": -0.09137500000000012,
        "reward_min": -2.476268750000001,
        "leartime_s": 0.043217968981480226,
        "sampletime": 0.8249588530161418,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 92800,
        "reward_mean": -1.2679,
        "reward_max": 0.011993749999999914,
        "reward_min": -2.6217937499999997,
        "leartime_s": 0.05690851400140673,
        "sampletime": 0.8028604660066776,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 93000,
        "reward_mean": -1.0986500000000001,
        "reward_max": -0.11216250000000015,
        "reward_min": -2.1842124999999997,
        "leartime_s": 0.04025174101116136,
        "sampletime": 0.6564203080197331,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 93200,
        "reward_mean": -1.123525,
        "reward_max": -0.17656250000000007,
        "reward_min": -2.7922124999999998,
        "leartime_s": 0.07953307899879292,
        "sampletime": 0.6623954169917852,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 93400,
        "reward_mean": -1.0373250000000003,
        "reward_max": 0.054893749999999866,
        "reward_min": -2.3931375000000004,
        "leartime_s": 0.08905292800045572,
        "sampletime": 0.6848409659869503,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 93600,
        "reward_mean": -1.1301,
        "reward_max": -0.2806875000000002,
        "reward_min": -2.3624874999999994,
        "leartime_s": 0.0941498999891337,
        "sampletime": 1.0554642880160827,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 93800,
        "reward_mean": -1.1265749999999999,
        "reward_max": -0.12579374999999998,
        "reward_min": -2.5145999999999993,
        "leartime_s": 0.09614194100140594,
        "sampletime": 0.7767157159978524,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 94000,
        "reward_mean": -1.23495,
        "reward_max": -0.07752500000000007,
        "reward_min": -2.526825000000001,
        "leartime_s": 0.07568895298754796,
        "sampletime": 0.6883615219849162,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 94200,
        "reward_mean": -1.1963250000000003,
        "reward_max": -0.2794375000000001,
        "reward_min": -2.4573937499999996,
        "leartime_s": 0.043782302003819495,
        "sampletime": 0.727517669001827,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 94400,
        "reward_mean": -1.1771999999999998,
        "reward_max": -0.19798749999999993,
        "reward_min": -2.3832499999999994,
        "leartime_s": 0.06351506698410958,
        "sampletime": 0.7032666169980075,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 94600,
        "reward_mean": -1.0268000000000002,
        "reward_max": 0.004524999999999932,
        "reward_min": -1.9293625000000003,
        "leartime_s": 0.08884513701195829,
        "sampletime": 0.6872189239948057,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 94800,
        "reward_mean": -1.1465500000000002,
        "reward_max": -0.31560000000000027,
        "reward_min": -2.991493750000001,
        "leartime_s": 0.04662211300455965,
        "sampletime": 0.7209972499986179,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 95000,
        "reward_mean": -1.3096999999999999,
        "reward_max": -0.48074999999999984,
        "reward_min": -2.3530875,
        "leartime_s": 0.07679155899677426,
        "sampletime": 0.6547482929890975,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 95200,
        "reward_mean": -1.143225,
        "reward_max": -0.04074999999999999,
        "reward_min": -2.5190812499999997,
        "leartime_s": 0.04062883698497899,
        "sampletime": 0.6774032349931076,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 95400,
        "reward_mean": -1.183825,
        "reward_max": -0.13236875,
        "reward_min": -2.1925812499999995,
        "leartime_s": 0.08280568799818866,
        "sampletime": 0.5981169500155374,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 95600,
        "reward_mean": -1.1069500000000003,
        "reward_max": -0.1122250000000003,
        "reward_min": -2.6026625000000005,
        "leartime_s": 0.08012164299725555,
        "sampletime": 0.7461858890019357,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 95800,
        "reward_mean": -1.2550500000000002,
        "reward_max": -0.16901875000000022,
        "reward_min": -2.5812437499999996,
        "leartime_s": 0.058797378005692735,
        "sampletime": 0.9054312180087436,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 96000,
        "reward_mean": -1.1271250000000002,
        "reward_max": -0.03228124999999987,
        "reward_min": -2.4155125000000006,
        "leartime_s": 0.049756813008571044,
        "sampletime": 0.8292815290042199,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 96200,
        "reward_mean": -1.0964250000000002,
        "reward_max": 0.02321249999999983,
        "reward_min": -2.3288750000000005,
        "leartime_s": 0.05183415600913577,
        "sampletime": 0.7932453049870674,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 96400,
        "reward_mean": -1.1778750000000002,
        "reward_max": -0.008556250000000029,
        "reward_min": -2.3778875,
        "leartime_s": 0.08276012999704108,
        "sampletime": 0.7854216170089785,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 96600,
        "reward_mean": -1.0559749999999999,
        "reward_max": -0.18831250000000002,
        "reward_min": -2.1253437500000003,
        "leartime_s": 0.0753556830168236,
        "sampletime": 0.8045686489786021,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 96800,
        "reward_mean": -1.2902500000000006,
        "reward_max": -0.36360625,
        "reward_min": -2.6070687499999994,
        "leartime_s": 0.06341756600886583,
        "sampletime": 0.6144914769975003,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 97000,
        "reward_mean": -1.41035,
        "reward_max": -0.43728124999999984,
        "reward_min": -2.6046624999999985,
        "leartime_s": 0.02953739499207586,
        "sampletime": 0.6439890320179984,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 97200,
        "reward_mean": -1.1307749999999999,
        "reward_max": -0.24164999999999998,
        "reward_min": -2.1406624999999995,
        "leartime_s": 0.03271462500561029,
        "sampletime": 0.8041673180123325,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 97400,
        "reward_mean": -1.417725,
        "reward_max": -0.37175,
        "reward_min": -2.6093249999999997,
        "leartime_s": 0.05495893501210958,
        "sampletime": 0.6031753849820234,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 97600,
        "reward_mean": -1.26755,
        "reward_max": -0.32105,
        "reward_min": -2.752887500000001,
        "leartime_s": 0.0525101300154347,
        "sampletime": 0.699530051992042,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 97800,
        "reward_mean": -1.1503,
        "reward_max": -0.17839999999999995,
        "reward_min": -2.3654437500000007,
        "leartime_s": 0.03257221498643048,
        "sampletime": 0.7162457869853824,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 98000,
        "reward_mean": -1.3431,
        "reward_max": -0.5221187499999997,
        "reward_min": -2.5145999999999997,
        "leartime_s": 0.05291616200702265,
        "sampletime": 0.6402906119765248,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 98200,
        "reward_mean": -1.0506249999999997,
        "reward_max": -0.02205624999999993,
        "reward_min": -2.6073125000000013,
        "leartime_s": 0.0665588979900349,
        "sampletime": 0.7319195159943774,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 98400,
        "reward_mean": -1.2284000000000002,
        "reward_max": -0.1425750000000002,
        "reward_min": -2.453875000000001,
        "leartime_s": 0.03025488101411611,
        "sampletime": 0.6618974469893146,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 98600,
        "reward_mean": -1.121025,
        "reward_max": -0.32306875,
        "reward_min": -2.31920625,
        "leartime_s": 0.03655607902328484,
        "sampletime": 0.7895859799755272,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 98800,
        "reward_mean": -1.0797750000000002,
        "reward_max": -0.012756250000000045,
        "reward_min": -2.02130625,
        "leartime_s": 0.02685301098972559,
        "sampletime": 0.732763662992511,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 99000,
        "reward_mean": -1.342375,
        "reward_max": -0.47100624999999996,
        "reward_min": -2.3867812500000003,
        "leartime_s": 0.07865420301095583,
        "sampletime": 0.7427092989964876,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 99200,
        "reward_mean": -1.1856000000000004,
        "reward_max": -0.4302062500000003,
        "reward_min": -2.4674750000000003,
        "leartime_s": 0.04242706499644555,
        "sampletime": 0.9577837109973188,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 99400,
        "reward_mean": -1.2426,
        "reward_max": -0.2144437500000001,
        "reward_min": -2.4748937500000006,
        "leartime_s": 0.04253756601247005,
        "sampletime": 0.6985059799917508,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 99600,
        "reward_mean": -1.111225,
        "reward_max": -0.20514375,
        "reward_min": -2.07693125,
        "leartime_s": 0.04386286699445918,
        "sampletime": 0.6963424969871994,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 99800,
        "reward_mean": -1.2515249999999998,
        "reward_max": -0.1316374999999998,
        "reward_min": -2.405875,
        "leartime_s": 0.06489836901891977,
        "sampletime": 0.6335934819944669,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 100000,
        "reward_mean": -1.133825,
        "reward_max": 0.16870624999999995,
        "reward_min": -2.7175874999999987,
        "leartime_s": 0.03806647000601515,
        "sampletime": 0.7034825320006348,
        "best_mean": -0.39657500000000007,
        "best_max": 0.4538874999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 22452,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]