[
    {
        "generation": 1,
        "timesteps": 2000,
        "reward_mean": -39.170675,
        "reward_max": -3.192937500000002,
        "reward_min": -75.46843750000001,
        "leartime_s": 0.022527364984853193,
        "sampletime": 1.6834596290136687,
        "best_mean": -39.170675,
        "best_max": -3.192937500000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 4000,
        "reward_mean": -37.822225,
        "reward_max": -1.3471875000000004,
        "reward_min": -140.0268125,
        "leartime_s": 0.0283829859981779,
        "sampletime": 2.1640373560076114,
        "best_mean": -37.822225,
        "best_max": -1.3471875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 6000,
        "reward_mean": -20.12475,
        "reward_max": 0.9047500000000006,
        "reward_min": -142.49325,
        "leartime_s": 0.04098312501446344,
        "sampletime": 1.9568566759990063,
        "best_mean": -20.12475,
        "best_max": 0.9047500000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 8000,
        "reward_mean": -18.342775000000003,
        "reward_max": 1.2775000000000007,
        "reward_min": -66.9355625,
        "leartime_s": 0.05156116699799895,
        "sampletime": 1.6552072859776672,
        "best_mean": -18.342775000000003,
        "best_max": 1.2775000000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 10000,
        "reward_mean": -18.104975000000003,
        "reward_max": -1.1691874999999998,
        "reward_min": -41.793375000000005,
        "leartime_s": 0.05791723198490217,
        "sampletime": 2.134241645981092,
        "best_mean": -18.104975000000003,
        "best_max": -1.1691874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 12000,
        "reward_mean": -18.173125,
        "reward_max": 1.0145625,
        "reward_min": -42.22112499999999,
        "leartime_s": 0.02376782600185834,
        "sampletime": 2.017709970998112,
        "best_mean": -18.104975000000003,
        "best_max": -1.1691874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 14000,
        "reward_mean": -14.654549999999999,
        "reward_max": -0.18612499999999943,
        "reward_min": -66.09918750000001,
        "leartime_s": 0.021871589997317642,
        "sampletime": 1.8706258469901513,
        "best_mean": -14.654549999999999,
        "best_max": -0.18612499999999943,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 16000,
        "reward_mean": -8.200275,
        "reward_max": -1.6268749999999998,
        "reward_min": -33.5028125,
        "leartime_s": 0.02823439400526695,
        "sampletime": 2.1843826239928603,
        "best_mean": -8.200275,
        "best_max": -1.6268749999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 18000,
        "reward_mean": -6.091925000000001,
        "reward_max": -1.3573124999999993,
        "reward_min": -60.23243749999999,
        "leartime_s": 0.004998132993932813,
        "sampletime": 2.0173751869879197,
        "best_mean": -6.091925000000001,
        "best_max": -1.3573124999999993,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 20000,
        "reward_mean": -3.881775,
        "reward_max": -0.8009999999999999,
        "reward_min": -10.140437499999999,
        "leartime_s": 0.032995436020428315,
        "sampletime": 1.8974854769767262,
        "best_mean": -3.881775,
        "best_max": -0.8009999999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 22000,
        "reward_mean": -2.2741000000000002,
        "reward_max": -0.34306249999999994,
        "reward_min": -4.7096875,
        "leartime_s": 0.00741542101604864,
        "sampletime": 1.8147733499936294,
        "best_mean": -2.2741000000000002,
        "best_max": -0.34306249999999994,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 24000,
        "reward_mean": -1.5713250000000003,
        "reward_max": 0.0216875,
        "reward_min": -3.2246875000000004,
        "leartime_s": 0.03838765199179761,
        "sampletime": 1.7528671080071945,
        "best_mean": -1.5713250000000003,
        "best_max": 0.0216875,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 26000,
        "reward_mean": -1.5920250000000005,
        "reward_max": -0.4363750000000003,
        "reward_min": -4.0120000000000005,
        "leartime_s": 0.007898315991042182,
        "sampletime": 2.0669389700051397,
        "best_mean": -1.5713250000000003,
        "best_max": 0.0216875,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 28000,
        "reward_mean": -1.4244000000000003,
        "reward_max": 0.013375000000000026,
        "reward_min": -2.8676875000000006,
        "leartime_s": 0.005949268990661949,
        "sampletime": 2.1380521199898794,
        "best_mean": -1.4244000000000003,
        "best_max": 0.013375000000000026,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 30000,
        "reward_mean": -1.5395750000000004,
        "reward_max": -0.3393750000000003,
        "reward_min": -3.365250000000001,
        "leartime_s": 0.007931808999273926,
        "sampletime": 1.7521108240180183,
        "best_mean": -1.4244000000000003,
        "best_max": 0.013375000000000026,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 32000,
        "reward_mean": -1.3541500000000002,
        "reward_max": -0.3579374999999998,
        "reward_min": -3.1556875,
        "leartime_s": 0.015772863989695907,
        "sampletime": 1.7307888959767297,
        "best_mean": -1.3541500000000002,
        "best_max": -0.3579374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 34000,
        "reward_mean": -1.48405,
        "reward_max": -0.20793750000000008,
        "reward_min": -2.9232500000000003,
        "leartime_s": 0.013838579994626343,
        "sampletime": 2.306568394007627,
        "best_mean": -1.3541500000000002,
        "best_max": -0.3579374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 36000,
        "reward_mean": -1.58565,
        "reward_max": 0.14437500000000017,
        "reward_min": -3.3193125,
        "leartime_s": 0.01782677401206456,
        "sampletime": 1.7351559410162736,
        "best_mean": -1.3541500000000002,
        "best_max": -0.3579374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 38000,
        "reward_mean": -1.4911250000000005,
        "reward_max": -0.2132499999999998,
        "reward_min": -3.2303750000000004,
        "leartime_s": 0.05869411397725344,
        "sampletime": 2.0404693960153963,
        "best_mean": -1.3541500000000002,
        "best_max": -0.3579374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 40000,
        "reward_mean": -1.4468,
        "reward_max": -0.49668750000000017,
        "reward_min": -3.2343750000000004,
        "leartime_s": 0.01812183699803427,
        "sampletime": 2.1861212060030084,
        "best_mean": -1.3541500000000002,
        "best_max": -0.3579374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 42000,
        "reward_mean": -1.31995,
        "reward_max": -0.2894374999999998,
        "reward_min": -2.5874375000000005,
        "leartime_s": 0.008441102982033044,
        "sampletime": 2.093739885982359,
        "best_mean": -1.31995,
        "best_max": -0.2894374999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 44000,
        "reward_mean": -1.2671,
        "reward_max": -0.2570624999999998,
        "reward_min": -2.2971875,
        "leartime_s": 0.010471961024450138,
        "sampletime": 2.492709838988958,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 46000,
        "reward_mean": -1.4323749999999997,
        "reward_max": -0.38843749999999994,
        "reward_min": -2.7901875,
        "leartime_s": 0.012762790982378647,
        "sampletime": 1.752014480996877,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 48000,
        "reward_mean": -1.6326000000000003,
        "reward_max": -0.4192499999999998,
        "reward_min": -2.7425624999999996,
        "leartime_s": 0.006518957001389936,
        "sampletime": 1.8780902569997124,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 50000,
        "reward_mean": -1.5356500000000002,
        "reward_max": -0.5321874999999999,
        "reward_min": -2.7166875,
        "leartime_s": 0.00897710700519383,
        "sampletime": 2.146422417019494,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 52000,
        "reward_mean": -1.5476750000000001,
        "reward_max": -0.5564999999999999,
        "reward_min": -2.9636875,
        "leartime_s": 0.007903738995082676,
        "sampletime": 1.7412861949997023,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 54000,
        "reward_mean": -1.471975,
        "reward_max": -0.43975,
        "reward_min": -2.6935000000000002,
        "leartime_s": 0.04152243601856753,
        "sampletime": 1.964476494002156,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 56000,
        "reward_mean": -1.658675,
        "reward_max": -0.6664375000000001,
        "reward_min": -3.7970625,
        "leartime_s": 0.03272845200262964,
        "sampletime": 2.2015841600077692,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 58000,
        "reward_mean": -1.6920500000000003,
        "reward_max": -0.7701250000000001,
        "reward_min": -3.1345624999999995,
        "leartime_s": 0.015886604000115767,
        "sampletime": 1.7686772099987138,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 60000,
        "reward_mean": -1.4329250000000002,
        "reward_max": -0.33749999999999986,
        "reward_min": -2.53075,
        "leartime_s": 0.007204722001915798,
        "sampletime": 2.1587623689847533,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 62000,
        "reward_mean": -1.6552749999999998,
        "reward_max": -0.5832499999999999,
        "reward_min": -3.2618125,
        "leartime_s": 0.005847649008501321,
        "sampletime": 2.071276722010225,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 64000,
        "reward_mean": -1.6201250000000003,
        "reward_max": -0.49143749999999986,
        "reward_min": -2.7555625,
        "leartime_s": 0.0486761869979091,
        "sampletime": 1.7401827300200239,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 66000,
        "reward_mean": -1.7571499999999998,
        "reward_max": -0.7705625,
        "reward_min": -3.1685,
        "leartime_s": 0.020658085006289184,
        "sampletime": 1.727511327015236,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 68000,
        "reward_mean": -1.4710499999999997,
        "reward_max": -0.40093750000000006,
        "reward_min": -2.5263124999999995,
        "leartime_s": 0.029618141998071223,
        "sampletime": 2.11422509100521,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 70000,
        "reward_mean": -1.4213500000000003,
        "reward_max": -0.7311250000000001,
        "reward_min": -2.4711875,
        "leartime_s": 0.037063765979837626,
        "sampletime": 2.1963662820053287,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 72000,
        "reward_mean": -1.2713250000000003,
        "reward_max": -0.26518749999999985,
        "reward_min": -2.3459375,
        "leartime_s": 0.09233653597766533,
        "sampletime": 1.658814602997154,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 74000,
        "reward_mean": -1.49215,
        "reward_max": -0.3459375000000001,
        "reward_min": -2.647437499999999,
        "leartime_s": 0.006691666989354417,
        "sampletime": 2.3474912679812405,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 76000,
        "reward_mean": -1.3552000000000002,
        "reward_max": -0.4686874999999998,
        "reward_min": -2.4500000000000006,
        "leartime_s": 0.006184301018947735,
        "sampletime": 1.833949063991895,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 78000,
        "reward_mean": -1.2869500000000003,
        "reward_max": -0.28787500000000005,
        "reward_min": -2.7728124999999997,
        "leartime_s": 0.03752064099535346,
        "sampletime": 2.0888263790111523,
        "best_mean": -1.2671,
        "best_max": -0.2570624999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 80000,
        "reward_mean": -1.06775,
        "reward_max": -0.13962500000000005,
        "reward_min": -2.1748125000000003,
        "leartime_s": 0.015100056974915788,
        "sampletime": 2.155260327999713,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 82000,
        "reward_mean": -1.1930000000000003,
        "reward_max": -0.14743749999999967,
        "reward_min": -2.1938750000000002,
        "leartime_s": 0.03255337700829841,
        "sampletime": 1.7121811799879652,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 84000,
        "reward_mean": -1.11115,
        "reward_max": 0.06456249999999998,
        "reward_min": -2.3003125000000004,
        "leartime_s": 0.006754857982741669,
        "sampletime": 2.1286804839910474,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 86000,
        "reward_mean": -1.09345,
        "reward_max": -0.15274999999999994,
        "reward_min": -2.6793125,
        "leartime_s": 0.01902056101243943,
        "sampletime": 1.9606567739974707,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 88000,
        "reward_mean": -1.1521000000000001,
        "reward_max": 0.1226875000000003,
        "reward_min": -2.3009375000000007,
        "leartime_s": 0.00656263399287127,
        "sampletime": 1.975082658987958,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 90000,
        "reward_mean": -1.1257750000000002,
        "reward_max": 0.026625000000000364,
        "reward_min": -2.463250000000001,
        "leartime_s": 0.030223307985579595,
        "sampletime": 2.0393703850277234,
        "best_mean": -1.06775,
        "best_max": -0.13962500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 92000,
        "reward_mean": -0.9373250000000003,
        "reward_max": 0.14981250000000013,
        "reward_min": -2.167062500000001,
        "leartime_s": 0.023994806018890813,
        "sampletime": 2.1700601099873893,
        "best_mean": -0.9373250000000003,
        "best_max": 0.14981250000000013,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 94000,
        "reward_mean": -0.8136250000000002,
        "reward_max": 0.19750000000000023,
        "reward_min": -1.9311875000000005,
        "leartime_s": 0.03095834399573505,
        "sampletime": 1.874052280007163,
        "best_mean": -0.8136250000000002,
        "best_max": 0.19750000000000023,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 96000,
        "reward_mean": -0.9483750000000001,
        "reward_max": -0.08800000000000009,
        "reward_min": -2.4191875000000005,
        "leartime_s": 0.02661662598256953,
        "sampletime": 1.9553757139947265,
        "best_mean": -0.8136250000000002,
        "best_max": 0.19750000000000023,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 98000,
        "reward_mean": -0.6859750000000001,
        "reward_max": 0.23856250000000018,
        "reward_min": -1.6911875,
        "leartime_s": 0.014592176012229174,
        "sampletime": 1.6423113729979377,
        "best_mean": -0.6859750000000001,
        "best_max": 0.23856250000000018,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 100000,
        "reward_mean": -0.9274500000000001,
        "reward_max": -0.22556249999999983,
        "reward_min": -2.3201875000000007,
        "leartime_s": 0.01940546397236176,
        "sampletime": 2.022347752004862,
        "best_mean": -0.6859750000000001,
        "best_max": 0.23856250000000018,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 102000,
        "reward_mean": -0.6624750000000001,
        "reward_max": 0.2432500000000003,
        "reward_min": -2.2260000000000004,
        "leartime_s": 0.012011143000563607,
        "sampletime": 1.6472787740058266,
        "best_mean": -0.6624750000000001,
        "best_max": 0.2432500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 104000,
        "reward_mean": -0.6034,
        "reward_max": 0.23875000000000038,
        "reward_min": -1.801500000000001,
        "leartime_s": 0.030902892991434783,
        "sampletime": 1.9899129059922416,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 106000,
        "reward_mean": -0.8877500000000003,
        "reward_max": -0.08906249999999988,
        "reward_min": -2.0888750000000003,
        "leartime_s": 0.014366912975674495,
        "sampletime": 2.1570741559844464,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 108000,
        "reward_mean": -0.8604500000000002,
        "reward_max": 0.037937500000000145,
        "reward_min": -1.995875000000001,
        "leartime_s": 0.034083317004842684,
        "sampletime": 1.9310816270008218,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 110000,
        "reward_mean": -0.8826250000000001,
        "reward_max": -0.005624999999999908,
        "reward_min": -2.0869375000000003,
        "leartime_s": 0.07842177202110179,
        "sampletime": 2.092340024013538,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 112000,
        "reward_mean": -0.7139000000000001,
        "reward_max": 0.06656249999999991,
        "reward_min": -1.8053125000000005,
        "leartime_s": 0.01100487500661984,
        "sampletime": 2.180350760987494,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 114000,
        "reward_mean": -0.8626000000000001,
        "reward_max": 0.10887500000000025,
        "reward_min": -2.0622499999999997,
        "leartime_s": 0.030564479995518923,
        "sampletime": 1.9335492359823547,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 116000,
        "reward_mean": -0.9185500000000001,
        "reward_max": -0.06424999999999972,
        "reward_min": -1.8786874999999998,
        "leartime_s": 0.031275064015062526,
        "sampletime": 2.1944949380122125,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 118000,
        "reward_mean": -0.9212000000000002,
        "reward_max": -0.01749999999999978,
        "reward_min": -2.434000000000001,
        "leartime_s": 0.010840289003681391,
        "sampletime": 1.8532730090082623,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 120000,
        "reward_mean": -0.79615,
        "reward_max": 0.00531250000000031,
        "reward_min": -1.8073124999999997,
        "leartime_s": 0.022848083986900747,
        "sampletime": 1.9480065910029225,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 122000,
        "reward_mean": -0.7467,
        "reward_max": 0.31562500000000016,
        "reward_min": -1.7560625000000007,
        "leartime_s": 0.05097414000192657,
        "sampletime": 1.90245217300253,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 124000,
        "reward_mean": -1.0774750000000004,
        "reward_max": -0.24118750000000003,
        "reward_min": -2.0596875000000003,
        "leartime_s": 0.007608323998283595,
        "sampletime": 2.056396664993372,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 126000,
        "reward_mean": -0.9614750000000002,
        "reward_max": -0.05962499999999986,
        "reward_min": -2.209250000000001,
        "leartime_s": 0.007097918016370386,
        "sampletime": 1.8402038970089052,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 128000,
        "reward_mean": -0.8885500000000001,
        "reward_max": -0.0024999999999997663,
        "reward_min": -1.9102500000000004,
        "leartime_s": 0.011000120983226225,
        "sampletime": 2.1471375899855047,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 130000,
        "reward_mean": -0.9834,
        "reward_max": -0.20806249999999973,
        "reward_min": -2.0203125,
        "leartime_s": 0.010489178996067494,
        "sampletime": 1.7091024900146294,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 132000,
        "reward_mean": -1.0544,
        "reward_max": -0.1100624999999997,
        "reward_min": -2.4695000000000005,
        "leartime_s": 0.0409505229908973,
        "sampletime": 1.7490989729994908,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 134000,
        "reward_mean": -1.0791000000000002,
        "reward_max": -0.01912499999999963,
        "reward_min": -2.392750000000001,
        "leartime_s": 0.030155032000038773,
        "sampletime": 1.9583015009993687,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 136000,
        "reward_mean": -1.0049750000000002,
        "reward_max": -0.11718749999999992,
        "reward_min": -1.9750000000000005,
        "leartime_s": 0.0206993049941957,
        "sampletime": 1.9869830470124725,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 138000,
        "reward_mean": -1.049875,
        "reward_max": -0.2693125000000001,
        "reward_min": -2.0115625000000006,
        "leartime_s": 0.02487478801049292,
        "sampletime": 2.1504679679928813,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 140000,
        "reward_mean": -1.2253500000000004,
        "reward_max": -0.3046875,
        "reward_min": -2.7775000000000007,
        "leartime_s": 0.018449746014084667,
        "sampletime": 1.9439673589949962,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 142000,
        "reward_mean": -0.9443250000000001,
        "reward_max": -0.015374999999999805,
        "reward_min": -2.1645,
        "leartime_s": 0.011922651989152655,
        "sampletime": 1.963917313987622,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 144000,
        "reward_mean": -1.1108000000000002,
        "reward_max": -0.10137499999999992,
        "reward_min": -2.6490625,
        "leartime_s": 0.02969275100622326,
        "sampletime": 1.9321362199843861,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 146000,
        "reward_mean": -1.1796750000000003,
        "reward_max": -0.23668749999999994,
        "reward_min": -2.3386875000000003,
        "leartime_s": 0.017366587999276817,
        "sampletime": 1.7145754150114954,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 148000,
        "reward_mean": -1.1137249999999999,
        "reward_max": -0.1670000000000001,
        "reward_min": -2.2898125000000005,
        "leartime_s": 0.023729989014100283,
        "sampletime": 1.9850993390136864,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 150000,
        "reward_mean": -0.802825,
        "reward_max": 0.11862500000000024,
        "reward_min": -2.426187500000001,
        "leartime_s": 0.015594450000207871,
        "sampletime": 1.8904753669921774,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 152000,
        "reward_mean": -0.631025,
        "reward_max": 0.2361250000000003,
        "reward_min": -2.011812500000001,
        "leartime_s": 0.03087809798307717,
        "sampletime": 1.9559146410028916,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 154000,
        "reward_mean": -1.031775,
        "reward_max": 0.03618750000000028,
        "reward_min": -2.0911875000000006,
        "leartime_s": 0.010223535005934536,
        "sampletime": 1.7545873439812567,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 156000,
        "reward_mean": -0.7588,
        "reward_max": 0.47425000000000034,
        "reward_min": -2.3993125,
        "leartime_s": 0.029187454987550154,
        "sampletime": 2.252148960978957,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 158000,
        "reward_mean": -0.8492500000000001,
        "reward_max": 0.1380000000000003,
        "reward_min": -1.7896875000000005,
        "leartime_s": 0.025650562980445102,
        "sampletime": 1.8909124079800677,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 160000,
        "reward_mean": -0.798425,
        "reward_max": -0.007312499999999722,
        "reward_min": -2.0057499999999995,
        "leartime_s": 0.022893963003298268,
        "sampletime": 2.2861064299941063,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 162000,
        "reward_mean": -0.88365,
        "reward_max": -0.06824999999999976,
        "reward_min": -2.0960625000000004,
        "leartime_s": 0.015680381009588018,
        "sampletime": 1.7430650889873505,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 164000,
        "reward_mean": -0.9491000000000002,
        "reward_max": 0.0933750000000003,
        "reward_min": -2.2335000000000003,
        "leartime_s": 0.009961343021132052,
        "sampletime": 1.7256039749772754,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 166000,
        "reward_mean": -0.9063500000000001,
        "reward_max": 0.0834375,
        "reward_min": -2.0116875000000007,
        "leartime_s": 0.00607731202035211,
        "sampletime": 1.8361096699954942,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 168000,
        "reward_mean": -0.63585,
        "reward_max": 0.2782500000000002,
        "reward_min": -2.1728125,
        "leartime_s": 0.009568938985466957,
        "sampletime": 2.090246073988965,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 170000,
        "reward_mean": -0.8332250000000001,
        "reward_max": 0.09093750000000013,
        "reward_min": -2.0158750000000007,
        "leartime_s": 0.03705621199333109,
        "sampletime": 1.7734284120087977,
        "best_mean": -0.6034,
        "best_max": 0.23875000000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 172000,
        "reward_mean": -0.5062749999999998,
        "reward_max": 0.3794375000000002,
        "reward_min": -1.9470000000000003,
        "leartime_s": 0.027968754991889,
        "sampletime": 1.9915762760210782,
        "best_mean": -0.5062749999999998,
        "best_max": 0.3794375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 174000,
        "reward_mean": -0.45149999999999996,
        "reward_max": 0.44068750000000034,
        "reward_min": -1.8491875000000004,
        "leartime_s": 0.031553057982819155,
        "sampletime": 1.8716874139790889,
        "best_mean": -0.45149999999999996,
        "best_max": 0.44068750000000034,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 176000,
        "reward_mean": -0.7653250000000001,
        "reward_max": 0.23250000000000046,
        "reward_min": -2.122875,
        "leartime_s": 0.024540935002733022,
        "sampletime": 1.9425130590097979,
        "best_mean": -0.45149999999999996,
        "best_max": 0.44068750000000034,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 178000,
        "reward_mean": -0.45192499999999997,
        "reward_max": 0.48593750000000024,
        "reward_min": -1.4800624999999996,
        "leartime_s": 0.048905796982580796,
        "sampletime": 1.771901775005972,
        "best_mean": -0.45149999999999996,
        "best_max": 0.44068750000000034,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 180000,
        "reward_mean": -0.5094249999999998,
        "reward_max": 0.6509375000000005,
        "reward_min": -1.6242500000000002,
        "leartime_s": 0.02341029400122352,
        "sampletime": 2.216970401990693,
        "best_mean": -0.45149999999999996,
        "best_max": 0.44068750000000034,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 182000,
        "reward_mean": -0.3554999999999999,
        "reward_max": 0.6176250000000003,
        "reward_min": -1.4329375,
        "leartime_s": 0.022019185009412467,
        "sampletime": 2.076430929999333,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 184000,
        "reward_mean": -0.6154999999999998,
        "reward_max": 0.2123750000000003,
        "reward_min": -1.5903750000000003,
        "leartime_s": 0.03168177499901503,
        "sampletime": 1.8643987920077052,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 186000,
        "reward_mean": -0.40702499999999997,
        "reward_max": 0.8505625000000003,
        "reward_min": -1.4052500000000003,
        "leartime_s": 0.01865001698024571,
        "sampletime": 1.9844177779741585,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 188000,
        "reward_mean": -0.41649999999999987,
        "reward_max": 0.5954375000000005,
        "reward_min": -1.5776875000000004,
        "leartime_s": 0.03578298099455424,
        "sampletime": 2.0933707039803267,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 190000,
        "reward_mean": -0.4004749999999998,
        "reward_max": 0.4219375000000006,
        "reward_min": -1.4301875000000004,
        "leartime_s": 0.04515232000267133,
        "sampletime": 1.8792845610005315,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 192000,
        "reward_mean": -0.5074749999999999,
        "reward_max": 0.6436875000000006,
        "reward_min": -1.6601875000000001,
        "leartime_s": 0.04109409201191738,
        "sampletime": 1.7603741549828555,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 194000,
        "reward_mean": -0.5081749999999999,
        "reward_max": 0.7511250000000004,
        "reward_min": -1.5306250000000003,
        "leartime_s": 0.008380918996408582,
        "sampletime": 1.6959301310125738,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 196000,
        "reward_mean": -0.4260499999999998,
        "reward_max": 0.3291875000000004,
        "reward_min": -1.6023749999999999,
        "leartime_s": 0.02784241401241161,
        "sampletime": 1.8488432719896082,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 198000,
        "reward_mean": -0.6159749999999999,
        "reward_max": 0.3205625000000005,
        "reward_min": -1.8978750000000002,
        "leartime_s": 0.01249510599882342,
        "sampletime": 1.915841718990123,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 200000,
        "reward_mean": -0.4569749999999999,
        "reward_max": 0.5432500000000002,
        "reward_min": -1.5459375,
        "leartime_s": 0.05403965900768526,
        "sampletime": 1.8618083549954463,
        "best_mean": -0.3554999999999999,
        "best_max": 0.6176250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 202000,
        "reward_mean": -0.31234999999999985,
        "reward_max": 0.5675000000000003,
        "reward_min": -1.5661874999999996,
        "leartime_s": 0.010999599995557219,
        "sampletime": 1.8491068609873764,
        "best_mean": -0.31234999999999985,
        "best_max": 0.5675000000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 204000,
        "reward_mean": -0.5103999999999999,
        "reward_max": 0.5003750000000005,
        "reward_min": -1.4401249999999999,
        "leartime_s": 0.04190559999551624,
        "sampletime": 2.049818483996205,
        "best_mean": -0.31234999999999985,
        "best_max": 0.5675000000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 206000,
        "reward_mean": -0.634525,
        "reward_max": 0.39043750000000055,
        "reward_min": -1.7408125000000003,
        "leartime_s": 0.016519046010216698,
        "sampletime": 1.8047045640123542,
        "best_mean": -0.31234999999999985,
        "best_max": 0.5675000000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 208000,
        "reward_mean": -0.3970999999999999,
        "reward_max": 0.6192500000000003,
        "reward_min": -1.6633125000000006,
        "leartime_s": 0.026419290021294728,
        "sampletime": 2.1079490769770928,
        "best_mean": -0.31234999999999985,
        "best_max": 0.5675000000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 210000,
        "reward_mean": -0.2305999999999998,
        "reward_max": 0.5460625000000005,
        "reward_min": -1.2199375,
        "leartime_s": 0.029293831990798935,
        "sampletime": 2.026945738994982,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 212000,
        "reward_mean": -0.46649999999999986,
        "reward_max": 0.4584375000000003,
        "reward_min": -1.5864375,
        "leartime_s": 0.027919298998313025,
        "sampletime": 1.7173095119942445,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 214000,
        "reward_mean": -0.42217499999999986,
        "reward_max": 0.5625000000000002,
        "reward_min": -1.98075,
        "leartime_s": 0.021124819002579898,
        "sampletime": 1.9701684429892339,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 216000,
        "reward_mean": -0.30589999999999984,
        "reward_max": 0.4925000000000005,
        "reward_min": -1.5313750000000002,
        "leartime_s": 0.013077568000881001,
        "sampletime": 2.267071947979275,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 218000,
        "reward_mean": -0.4089249999999998,
        "reward_max": 0.38968750000000035,
        "reward_min": -1.6450624999999999,
        "leartime_s": 0.027812423009891063,
        "sampletime": 2.210459049005294,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 220000,
        "reward_mean": -0.3894749999999999,
        "reward_max": 0.31968750000000046,
        "reward_min": -1.3188750000000002,
        "leartime_s": 0.014458663994446397,
        "sampletime": 2.3158598099835217,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 222000,
        "reward_mean": -0.2722999999999998,
        "reward_max": 0.6351250000000005,
        "reward_min": -1.6571875000000003,
        "leartime_s": 0.0632372550026048,
        "sampletime": 1.7950694079918321,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 224000,
        "reward_mean": -0.34104999999999985,
        "reward_max": 0.4986875000000004,
        "reward_min": -1.7395000000000005,
        "leartime_s": 0.051328556990483776,
        "sampletime": 2.046824963996187,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 226000,
        "reward_mean": -0.5186999999999998,
        "reward_max": 0.46687500000000054,
        "reward_min": -1.7134375000000004,
        "leartime_s": 0.017335655022179708,
        "sampletime": 1.7508462879923172,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 228000,
        "reward_mean": -0.5583499999999999,
        "reward_max": 0.23787500000000028,
        "reward_min": -1.9667500000000002,
        "leartime_s": 0.01887326900032349,
        "sampletime": 1.7776750970224384,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 230000,
        "reward_mean": -0.5536749999999999,
        "reward_max": 1.0365625000000003,
        "reward_min": -1.8841875000000001,
        "leartime_s": 0.013455111999064684,
        "sampletime": 1.9689384840021376,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 232000,
        "reward_mean": -0.45734999999999987,
        "reward_max": 0.5235000000000005,
        "reward_min": -1.53175,
        "leartime_s": 0.009502031985903159,
        "sampletime": 2.3493713550269604,
        "best_mean": -0.2305999999999998,
        "best_max": 0.5460625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 234000,
        "reward_mean": -0.1653499999999998,
        "reward_max": 0.8206250000000002,
        "reward_min": -1.2284374999999996,
        "leartime_s": 0.024939265014836565,
        "sampletime": 1.7512160270125605,
        "best_mean": -0.1653499999999998,
        "best_max": 0.8206250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 236000,
        "reward_mean": -0.2052249999999998,
        "reward_max": 0.6403750000000001,
        "reward_min": -1.5666250000000004,
        "leartime_s": 0.043279899982735515,
        "sampletime": 1.993922865978675,
        "best_mean": -0.1653499999999998,
        "best_max": 0.8206250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 238000,
        "reward_mean": -0.12339999999999976,
        "reward_max": 0.7225000000000005,
        "reward_min": -1.4791250000000005,
        "leartime_s": 0.03759721398819238,
        "sampletime": 2.195551204000367,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 240000,
        "reward_mean": -0.35099999999999987,
        "reward_max": 0.4748125000000003,
        "reward_min": -1.2303750000000004,
        "leartime_s": 0.03005557702272199,
        "sampletime": 1.6960384100093506,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 242000,
        "reward_mean": -0.4913749999999999,
        "reward_max": 0.3105625000000002,
        "reward_min": -1.5186250000000003,
        "leartime_s": 0.009479168016696349,
        "sampletime": 2.0363159109838307,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 244000,
        "reward_mean": -0.15772499999999975,
        "reward_max": 0.9347500000000005,
        "reward_min": -1.4230624999999997,
        "leartime_s": 0.04049623798346147,
        "sampletime": 2.2726434050127864,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 246000,
        "reward_mean": -0.5859249999999997,
        "reward_max": 0.5098125000000006,
        "reward_min": -1.6326874999999994,
        "leartime_s": 0.020243900013156235,
        "sampletime": 1.8211222999962047,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 248000,
        "reward_mean": -0.20739999999999978,
        "reward_max": 0.6775625000000003,
        "reward_min": -1.5194999999999999,
        "leartime_s": 0.02715225302381441,
        "sampletime": 2.0404763739788905,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 250000,
        "reward_mean": -0.4607749999999999,
        "reward_max": 0.6516875000000005,
        "reward_min": -1.6495624999999998,
        "leartime_s": 0.025921036984072998,
        "sampletime": 2.0376431150070857,
        "best_mean": -0.12339999999999976,
        "best_max": 0.7225000000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 252000,
        "reward_mean": -0.0822499999999998,
        "reward_max": 0.7696875000000004,
        "reward_min": -0.8804375,
        "leartime_s": 0.019263157999375835,
        "sampletime": 2.0461656209954526,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 254000,
        "reward_mean": -0.37774999999999975,
        "reward_max": 0.6501250000000004,
        "reward_min": -1.4546875,
        "leartime_s": 0.03787410500808619,
        "sampletime": 1.8864007639931515,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 256000,
        "reward_mean": -0.3750749999999998,
        "reward_max": 0.5730000000000004,
        "reward_min": -1.2676250000000002,
        "leartime_s": 0.0864241259987466,
        "sampletime": 2.3640705200086813,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 258000,
        "reward_mean": -0.3255499999999998,
        "reward_max": 0.8330000000000005,
        "reward_min": -1.6598125000000001,
        "leartime_s": 0.013031907001277432,
        "sampletime": 1.7985967580170836,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 260000,
        "reward_mean": -0.22857499999999975,
        "reward_max": 0.7363125000000006,
        "reward_min": -1.3224375000000004,
        "leartime_s": 0.015767600008985028,
        "sampletime": 1.6730280560150277,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 262000,
        "reward_mean": -0.29037499999999977,
        "reward_max": 0.7840625000000006,
        "reward_min": -1.4089375000000002,
        "leartime_s": 0.028629339998587966,
        "sampletime": 1.9100023200153373,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 264000,
        "reward_mean": -0.22164999999999968,
        "reward_max": 0.7960000000000005,
        "reward_min": -1.296125,
        "leartime_s": 0.04971929299063049,
        "sampletime": 1.8507568280037958,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 266000,
        "reward_mean": -0.10519999999999974,
        "reward_max": 0.9659375000000003,
        "reward_min": -1.2163125,
        "leartime_s": 0.022941158997127786,
        "sampletime": 2.2284121029952075,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 268000,
        "reward_mean": -0.2967249999999998,
        "reward_max": 0.6798125000000005,
        "reward_min": -1.8249375000000003,
        "leartime_s": 0.013923795020673424,
        "sampletime": 2.131671588984318,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 270000,
        "reward_mean": -0.3034249999999998,
        "reward_max": 0.5250000000000005,
        "reward_min": -1.5870000000000004,
        "leartime_s": 0.04814923999947496,
        "sampletime": 1.750032132025808,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 272000,
        "reward_mean": -0.24942499999999976,
        "reward_max": 0.6098750000000006,
        "reward_min": -1.5704999999999998,
        "leartime_s": 0.06937853500130586,
        "sampletime": 2.2279640120104887,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 274000,
        "reward_mean": -0.20947499999999977,
        "reward_max": 0.5668125000000007,
        "reward_min": -1.4825000000000002,
        "leartime_s": 0.01882700901478529,
        "sampletime": 1.832353375008097,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 276000,
        "reward_mean": -0.21869999999999978,
        "reward_max": 1.1048750000000007,
        "reward_min": -1.5956875000000001,
        "leartime_s": 0.03169797101872973,
        "sampletime": 1.9721534440177493,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 278000,
        "reward_mean": -0.1748999999999997,
        "reward_max": 0.6230000000000003,
        "reward_min": -1.4662499999999998,
        "leartime_s": 0.02672230001189746,
        "sampletime": 1.9978132609976456,
        "best_mean": -0.0822499999999998,
        "best_max": 0.7696875000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 280000,
        "reward_mean": -0.011699999999999692,
        "reward_max": 1.0757500000000002,
        "reward_min": -1.3387499999999999,
        "leartime_s": 0.017721526004606858,
        "sampletime": 1.9432250980171375,
        "best_mean": -0.011699999999999692,
        "best_max": 1.0757500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 282000,
        "reward_mean": -0.06207499999999974,
        "reward_max": 1.0802500000000004,
        "reward_min": -1.2791875,
        "leartime_s": 0.026342147000832483,
        "sampletime": 1.9358319420134649,
        "best_mean": -0.011699999999999692,
        "best_max": 1.0757500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 284000,
        "reward_mean": -0.13012499999999974,
        "reward_max": 0.8775000000000004,
        "reward_min": -1.2933750000000002,
        "leartime_s": 0.01766261601005681,
        "sampletime": 2.189407678000862,
        "best_mean": -0.011699999999999692,
        "best_max": 1.0757500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 286000,
        "reward_mean": -0.2738749999999997,
        "reward_max": 0.6623750000000005,
        "reward_min": -1.2789375,
        "leartime_s": 0.0364867799798958,
        "sampletime": 2.1193370379914995,
        "best_mean": -0.011699999999999692,
        "best_max": 1.0757500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 288000,
        "reward_mean": 0.09190000000000029,
        "reward_max": 1.2607500000000003,
        "reward_min": -0.9921249999999999,
        "leartime_s": 0.05424944599508308,
        "sampletime": 2.0168105060001835,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 290000,
        "reward_mean": 0.02055000000000034,
        "reward_max": 0.8992500000000005,
        "reward_min": -0.9061250000000001,
        "leartime_s": 0.03577631400548853,
        "sampletime": 1.769979171018349,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 292000,
        "reward_mean": -0.011424999999999649,
        "reward_max": 0.9208750000000004,
        "reward_min": -1.173125,
        "leartime_s": 0.0143313980079256,
        "sampletime": 1.968635439989157,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 294000,
        "reward_mean": -0.12862499999999968,
        "reward_max": 0.9433125000000006,
        "reward_min": -1.4182500000000005,
        "leartime_s": 0.015000662999227643,
        "sampletime": 1.7034278250066563,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 296000,
        "reward_mean": -0.20942499999999972,
        "reward_max": 0.6956875000000003,
        "reward_min": -1.8216875000000003,
        "leartime_s": 0.017536914005177096,
        "sampletime": 1.918466388975503,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 298000,
        "reward_mean": -0.2713499999999998,
        "reward_max": 0.47843750000000024,
        "reward_min": -1.10825,
        "leartime_s": 0.017530293989693746,
        "sampletime": 1.7670649439969566,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 300000,
        "reward_mean": -0.18804999999999975,
        "reward_max": 0.5568750000000003,
        "reward_min": -1.4536249999999997,
        "leartime_s": 0.010062623012345284,
        "sampletime": 2.1662544920109212,
        "best_mean": 0.09190000000000029,
        "best_max": 1.2607500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 302000,
        "reward_mean": 0.3689250000000003,
        "reward_max": 1.2173750000000008,
        "reward_min": -0.8681874999999998,
        "leartime_s": 0.014298157999292016,
        "sampletime": 2.121083448000718,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 304000,
        "reward_mean": 0.00017500000000029826,
        "reward_max": 0.9236250000000003,
        "reward_min": -1.0146250000000003,
        "leartime_s": 0.02618068500305526,
        "sampletime": 2.0897397350054234,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 306000,
        "reward_mean": -0.13139999999999966,
        "reward_max": 0.6273750000000008,
        "reward_min": -1.0483125,
        "leartime_s": 0.011509484000271186,
        "sampletime": 2.315552112995647,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 308000,
        "reward_mean": 0.06605000000000026,
        "reward_max": 1.3028125000000002,
        "reward_min": -1.2984375,
        "leartime_s": 0.04238933901069686,
        "sampletime": 1.8215641800197773,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 310000,
        "reward_mean": 0.06285000000000038,
        "reward_max": 1.1848750000000006,
        "reward_min": -1.0622499999999997,
        "leartime_s": 0.011299103003693745,
        "sampletime": 2.2971738129854202,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 312000,
        "reward_mean": -0.08897499999999968,
        "reward_max": 0.9899375000000005,
        "reward_min": -1.3141875000000003,
        "leartime_s": 0.015577777987346053,
        "sampletime": 2.103990479983622,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 314000,
        "reward_mean": -0.07042499999999967,
        "reward_max": 0.9513750000000006,
        "reward_min": -1.3760625,
        "leartime_s": 0.03158209900720976,
        "sampletime": 2.1137856949935667,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 316000,
        "reward_mean": 0.18225000000000033,
        "reward_max": 1.1050625,
        "reward_min": -1.2219375000000001,
        "leartime_s": 0.055258765001781285,
        "sampletime": 2.049184889998287,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 318000,
        "reward_mean": -0.10567499999999977,
        "reward_max": 0.9822500000000006,
        "reward_min": -1.2193124999999996,
        "leartime_s": 0.0583034289884381,
        "sampletime": 1.753500812978018,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 320000,
        "reward_mean": -0.017249999999999717,
        "reward_max": 0.9654375000000004,
        "reward_min": -1.255375,
        "leartime_s": 0.010922980000032112,
        "sampletime": 2.338029671984259,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 322000,
        "reward_mean": -0.08684999999999969,
        "reward_max": 0.8545000000000003,
        "reward_min": -2.0075,
        "leartime_s": 0.011396324000088498,
        "sampletime": 1.9182235240004957,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 324000,
        "reward_mean": -0.06709999999999972,
        "reward_max": 1.0107500000000007,
        "reward_min": -1.119375,
        "leartime_s": 0.02474300400353968,
        "sampletime": 1.9109577590133995,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 326000,
        "reward_mean": -0.35964999999999975,
        "reward_max": 0.6914375000000004,
        "reward_min": -1.4008749999999996,
        "leartime_s": 0.052223810023861006,
        "sampletime": 2.4664172810153104,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 328000,
        "reward_mean": -0.09222499999999977,
        "reward_max": 0.8138125000000004,
        "reward_min": -1.1220624999999997,
        "leartime_s": 0.04047305299900472,
        "sampletime": 1.735884090012405,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 330000,
        "reward_mean": -0.08254999999999961,
        "reward_max": 0.7935625000000003,
        "reward_min": -1.2808749999999998,
        "leartime_s": 0.03961297101341188,
        "sampletime": 1.7229352389986161,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 332000,
        "reward_mean": 0.06440000000000023,
        "reward_max": 0.8836875000000004,
        "reward_min": -1.2783749999999998,
        "leartime_s": 0.04705371698946692,
        "sampletime": 1.912266956991516,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 334000,
        "reward_mean": -0.009949999999999754,
        "reward_max": 1.2944375000000001,
        "reward_min": -1.1454999999999997,
        "leartime_s": 0.033541976008564234,
        "sampletime": 1.980816852999851,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 336000,
        "reward_mean": 0.05772500000000031,
        "reward_max": 0.9581875000000004,
        "reward_min": -1.3040624999999997,
        "leartime_s": 0.030538480990799144,
        "sampletime": 1.8678777079912834,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 338000,
        "reward_mean": 0.09705000000000033,
        "reward_max": 1.0638750000000006,
        "reward_min": -1.213375,
        "leartime_s": 0.029807000973960385,
        "sampletime": 2.241358402010519,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 340000,
        "reward_mean": -0.10104999999999972,
        "reward_max": 1.1760625000000005,
        "reward_min": -1.341625,
        "leartime_s": 0.021479785995325074,
        "sampletime": 2.0874741169973277,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 342000,
        "reward_mean": -0.06989999999999977,
        "reward_max": 0.8372500000000003,
        "reward_min": -1.2096874999999998,
        "leartime_s": 0.05605403700610623,
        "sampletime": 1.8336315949854907,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 344000,
        "reward_mean": -0.13742499999999971,
        "reward_max": 0.8283125000000005,
        "reward_min": -1.5883124999999998,
        "leartime_s": 0.012664362002396956,
        "sampletime": 2.22522527599358,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 346000,
        "reward_mean": -0.11602499999999974,
        "reward_max": 0.8878750000000005,
        "reward_min": -1.2086875,
        "leartime_s": 0.04887663200497627,
        "sampletime": 1.930661708000116,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 348000,
        "reward_mean": -0.010649999999999686,
        "reward_max": 1.0248750000000004,
        "reward_min": -1.2197500000000001,
        "leartime_s": 0.04494225900270976,
        "sampletime": 2.141134936013259,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 350000,
        "reward_mean": -0.23909999999999973,
        "reward_max": 0.7055000000000007,
        "reward_min": -1.4856250000000002,
        "leartime_s": 0.03429815199342556,
        "sampletime": 2.066206029994646,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 352000,
        "reward_mean": -0.1305249999999997,
        "reward_max": 1.0070000000000006,
        "reward_min": -1.3957500000000005,
        "leartime_s": 0.046197270014090464,
        "sampletime": 2.0543517070182133,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 354000,
        "reward_mean": 0.05257500000000035,
        "reward_max": 1.0313750000000004,
        "reward_min": -1.2528750000000004,
        "leartime_s": 0.01804793899646029,
        "sampletime": 2.032733729982283,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 356000,
        "reward_mean": 0.08505000000000033,
        "reward_max": 1.0395000000000005,
        "reward_min": -1.0453749999999995,
        "leartime_s": 0.05674430399085395,
        "sampletime": 1.769782037998084,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 358000,
        "reward_mean": -0.21767499999999976,
        "reward_max": 0.7820000000000005,
        "reward_min": -1.3028749999999998,
        "leartime_s": 0.0128215049917344,
        "sampletime": 2.085923194012139,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 360000,
        "reward_mean": 0.18790000000000026,
        "reward_max": 1.245125,
        "reward_min": -0.8223125,
        "leartime_s": 0.02895308900042437,
        "sampletime": 1.9447664510225877,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 362000,
        "reward_mean": -0.004124999999999749,
        "reward_max": 0.9270000000000007,
        "reward_min": -0.9982499999999997,
        "leartime_s": 0.01291028200648725,
        "sampletime": 1.9250024769862648,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 364000,
        "reward_mean": -0.07407499999999977,
        "reward_max": 0.9394375000000004,
        "reward_min": -1.1086250000000002,
        "leartime_s": 0.04406906000804156,
        "sampletime": 1.6591707619954832,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 366000,
        "reward_mean": -0.045824999999999665,
        "reward_max": 1.0633125000000003,
        "reward_min": -0.9553124999999995,
        "leartime_s": 0.033079411019571126,
        "sampletime": 1.8817937559797429,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 368000,
        "reward_mean": 0.0060750000000003275,
        "reward_max": 1.3592500000000007,
        "reward_min": -1.0230624999999998,
        "leartime_s": 0.056938453984912485,
        "sampletime": 1.6962584180000704,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 370000,
        "reward_mean": -0.03894999999999971,
        "reward_max": 1.0491250000000005,
        "reward_min": -1.5153125,
        "leartime_s": 0.051091895991703495,
        "sampletime": 2.1931647390010767,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 372000,
        "reward_mean": -0.026974999999999826,
        "reward_max": 0.8107500000000001,
        "reward_min": -1.0053125,
        "leartime_s": 0.038792538980487734,
        "sampletime": 2.040715180017287,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 374000,
        "reward_mean": 0.14652500000000032,
        "reward_max": 0.9448750000000004,
        "reward_min": -1.1255624999999998,
        "leartime_s": 0.013524291018256918,
        "sampletime": 1.862275002989918,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 376000,
        "reward_mean": 0.041350000000000324,
        "reward_max": 0.9900000000000004,
        "reward_min": -0.9606874999999997,
        "leartime_s": 0.034080059005646035,
        "sampletime": 2.143759353988571,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 378000,
        "reward_mean": -0.17292499999999975,
        "reward_max": 0.7110625000000004,
        "reward_min": -1.2816874999999999,
        "leartime_s": 0.028338569012703374,
        "sampletime": 1.8135267600009684,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 380000,
        "reward_mean": 0.16035000000000035,
        "reward_max": 1.1354375000000005,
        "reward_min": -1.3320625,
        "leartime_s": 0.01779126698966138,
        "sampletime": 2.2052320769871585,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 382000,
        "reward_mean": -0.03494999999999972,
        "reward_max": 0.7719375000000006,
        "reward_min": -1.4653750000000003,
        "leartime_s": 0.05161441001109779,
        "sampletime": 2.1113552289898507,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 384000,
        "reward_mean": -0.1555249999999997,
        "reward_max": 0.8196250000000004,
        "reward_min": -1.6212499999999999,
        "leartime_s": 0.03696838900214061,
        "sampletime": 2.2027312380087096,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 386000,
        "reward_mean": -0.19572499999999973,
        "reward_max": 0.8330000000000004,
        "reward_min": -1.3424999999999998,
        "leartime_s": 0.024271639995276928,
        "sampletime": 2.0250280179898255,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 388000,
        "reward_mean": 0.010050000000000217,
        "reward_max": 0.9098125000000004,
        "reward_min": -1.1323750000000001,
        "leartime_s": 0.03309168800478801,
        "sampletime": 1.6952198290091474,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 390000,
        "reward_mean": 0.044125000000000324,
        "reward_max": 0.9696250000000006,
        "reward_min": -0.9237499999999998,
        "leartime_s": 0.012393192009767517,
        "sampletime": 2.0681943199888337,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 392000,
        "reward_mean": 0.058800000000000255,
        "reward_max": 0.9093750000000003,
        "reward_min": -1.1804375,
        "leartime_s": 0.020368547993712127,
        "sampletime": 2.0180260479974095,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 394000,
        "reward_mean": -0.15379999999999974,
        "reward_max": 0.8354375000000005,
        "reward_min": -1.2219375,
        "leartime_s": 0.03916422897600569,
        "sampletime": 1.8663678129960317,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 396000,
        "reward_mean": -0.1685749999999997,
        "reward_max": 0.6425625000000005,
        "reward_min": -1.12125,
        "leartime_s": 0.026473476988030598,
        "sampletime": 1.9341763989941683,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 398000,
        "reward_mean": 0.07665000000000027,
        "reward_max": 0.9540625000000001,
        "reward_min": -0.772,
        "leartime_s": 0.049132719985209405,
        "sampletime": 1.6466007290000562,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 400000,
        "reward_mean": 0.15210000000000032,
        "reward_max": 0.9986250000000005,
        "reward_min": -0.9984374999999999,
        "leartime_s": 0.032699698000214994,
        "sampletime": 1.9246328070003074,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 402000,
        "reward_mean": -0.10414999999999976,
        "reward_max": 0.8279375000000003,
        "reward_min": -1.2177499999999997,
        "leartime_s": 0.07698300399351865,
        "sampletime": 2.0793183030036744,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 404000,
        "reward_mean": -0.3570999999999998,
        "reward_max": 0.5775000000000003,
        "reward_min": -1.3719375000000003,
        "leartime_s": 0.061184395977761596,
        "sampletime": 2.248636935983086,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 406000,
        "reward_mean": 0.14705000000000035,
        "reward_max": 1.1069375000000008,
        "reward_min": -1.0109374999999996,
        "leartime_s": 0.028113166976254433,
        "sampletime": 1.6476739089994226,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 408000,
        "reward_mean": -0.020474999999999674,
        "reward_max": 0.8119375000000006,
        "reward_min": -1.3904999999999996,
        "leartime_s": 0.060440959001425654,
        "sampletime": 1.918105203018058,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 410000,
        "reward_mean": 0.05015000000000034,
        "reward_max": 0.8881250000000006,
        "reward_min": -0.8436874999999997,
        "leartime_s": 0.04052682899055071,
        "sampletime": 1.990746247000061,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 412000,
        "reward_mean": -0.01387499999999978,
        "reward_max": 0.9962500000000006,
        "reward_min": -1.3514375,
        "leartime_s": 0.09375569198164158,
        "sampletime": 1.7371737339999527,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 414000,
        "reward_mean": 0.04150000000000033,
        "reward_max": 0.9850625000000005,
        "reward_min": -1.2100000000000002,
        "leartime_s": 0.013355940027395263,
        "sampletime": 2.1355969269934576,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 416000,
        "reward_mean": -0.17327499999999976,
        "reward_max": 0.8293125000000002,
        "reward_min": -1.493125,
        "leartime_s": 0.026826136017916724,
        "sampletime": 1.9546835560176987,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 418000,
        "reward_mean": -0.2560749999999998,
        "reward_max": 0.6371875000000005,
        "reward_min": -1.219375,
        "leartime_s": 0.0470062320237048,
        "sampletime": 1.810125837015221,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 420000,
        "reward_mean": 0.009725000000000272,
        "reward_max": 1.0273125000000005,
        "reward_min": -1.4923125,
        "leartime_s": 0.0975054329901468,
        "sampletime": 1.9837660259800032,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 422000,
        "reward_mean": -0.04737499999999972,
        "reward_max": 0.9798750000000004,
        "reward_min": -1.2671249999999998,
        "leartime_s": 0.04580169002292678,
        "sampletime": 2.4757527800102253,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 424000,
        "reward_mean": 0.03175000000000026,
        "reward_max": 0.9252500000000005,
        "reward_min": -0.9827499999999999,
        "leartime_s": 0.05653746100142598,
        "sampletime": 1.7136291660135612,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 426000,
        "reward_mean": 0.0903000000000003,
        "reward_max": 1.1421875000000006,
        "reward_min": -1.02525,
        "leartime_s": 0.015702745993621647,
        "sampletime": 2.3132537069905084,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 428000,
        "reward_mean": -0.21604999999999971,
        "reward_max": 0.6271250000000006,
        "reward_min": -1.3508750000000003,
        "leartime_s": 0.040257866989122704,
        "sampletime": 1.9426956860115752,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 430000,
        "reward_mean": 0.14710000000000029,
        "reward_max": 0.9065625000000002,
        "reward_min": -0.7431874999999998,
        "leartime_s": 0.04207720098202117,
        "sampletime": 1.8842141529894434,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 432000,
        "reward_mean": -0.1889249999999998,
        "reward_max": 0.6047500000000002,
        "reward_min": -1.2388125,
        "leartime_s": 0.025317913998151198,
        "sampletime": 1.778546671004733,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 434000,
        "reward_mean": 0.025275000000000252,
        "reward_max": 1.1136875000000004,
        "reward_min": -1.2608125000000003,
        "leartime_s": 0.04312643900630064,
        "sampletime": 1.8976388739829417,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 436000,
        "reward_mean": 0.11260000000000035,
        "reward_max": 1.1543750000000006,
        "reward_min": -1.1073749999999998,
        "leartime_s": 0.059438972995849326,
        "sampletime": 2.076631367992377,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 438000,
        "reward_mean": -0.2404749999999998,
        "reward_max": 0.8740625000000005,
        "reward_min": -1.20725,
        "leartime_s": 0.04628329601837322,
        "sampletime": 1.9034539540007245,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 440000,
        "reward_mean": 0.03320000000000037,
        "reward_max": 1.1341250000000003,
        "reward_min": -1.024875,
        "leartime_s": 0.026818437996553257,
        "sampletime": 2.278386697988026,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 442000,
        "reward_mean": -0.14879999999999977,
        "reward_max": 0.7746250000000005,
        "reward_min": -1.4296875,
        "leartime_s": 0.03866716302582063,
        "sampletime": 1.7227278460050002,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 444000,
        "reward_mean": -0.2224249999999997,
        "reward_max": 0.8578750000000004,
        "reward_min": -1.327625,
        "leartime_s": 0.04305667901644483,
        "sampletime": 2.163600010011578,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 446000,
        "reward_mean": -0.024149999999999686,
        "reward_max": 0.7874375000000007,
        "reward_min": -0.9873749999999999,
        "leartime_s": 0.03991348302224651,
        "sampletime": 1.8496013460098766,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 448000,
        "reward_mean": 0.17082500000000028,
        "reward_max": 1.1895625000000005,
        "reward_min": -1.2449375,
        "leartime_s": 0.07734776500728913,
        "sampletime": 2.2995230949891265,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 450000,
        "reward_mean": -0.08064999999999978,
        "reward_max": 0.8135000000000002,
        "reward_min": -1.4324375,
        "leartime_s": 0.033834923000540584,
        "sampletime": 2.1009662639989983,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 452000,
        "reward_mean": 0.14700000000000035,
        "reward_max": 1.2478750000000005,
        "reward_min": -1.0764999999999998,
        "leartime_s": 0.047492304001934826,
        "sampletime": 1.8244467850017827,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 454000,
        "reward_mean": 0.2468000000000004,
        "reward_max": 1.0939375000000005,
        "reward_min": -1.0937499999999998,
        "leartime_s": 0.027925055008381605,
        "sampletime": 2.3338621410075575,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 456000,
        "reward_mean": -0.16369999999999976,
        "reward_max": 0.7910000000000004,
        "reward_min": -1.8319375,
        "leartime_s": 0.03696847701212391,
        "sampletime": 1.980524251004681,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 458000,
        "reward_mean": -0.17907499999999976,
        "reward_max": 0.7307500000000002,
        "reward_min": -1.4543749999999998,
        "leartime_s": 0.025786126992898062,
        "sampletime": 2.269929014990339,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 460000,
        "reward_mean": -0.28659999999999974,
        "reward_max": 0.8060000000000006,
        "reward_min": -1.5213125000000003,
        "leartime_s": 0.03271875498467125,
        "sampletime": 2.0401042650046293,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 462000,
        "reward_mean": -0.23102499999999976,
        "reward_max": 0.8538750000000004,
        "reward_min": -1.2733749999999995,
        "leartime_s": 0.05389354401268065,
        "sampletime": 1.972376883000834,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 464000,
        "reward_mean": -0.025224999999999685,
        "reward_max": 0.9780625000000004,
        "reward_min": -1.0645,
        "leartime_s": 0.033906754018971696,
        "sampletime": 1.8686060320178512,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 466000,
        "reward_mean": -0.06047499999999971,
        "reward_max": 0.7900625000000001,
        "reward_min": -1.1834375000000001,
        "leartime_s": 0.03648915601661429,
        "sampletime": 1.744028725021053,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 468000,
        "reward_mean": -0.17172499999999974,
        "reward_max": 0.8178750000000005,
        "reward_min": -1.2706874999999997,
        "leartime_s": 0.020667395991040394,
        "sampletime": 1.6513153950218111,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 470000,
        "reward_mean": -0.19597499999999973,
        "reward_max": 0.9090625000000004,
        "reward_min": -1.3755000000000002,
        "leartime_s": 0.04333866899833083,
        "sampletime": 1.9476797640090808,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 472000,
        "reward_mean": -0.11632499999999976,
        "reward_max": 0.9791250000000007,
        "reward_min": -1.156375,
        "leartime_s": 0.03655044501647353,
        "sampletime": 2.0896495869965293,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 474000,
        "reward_mean": -0.17442499999999972,
        "reward_max": 0.5976250000000003,
        "reward_min": -1.3314374999999998,
        "leartime_s": 0.04641635398729704,
        "sampletime": 2.000528475997271,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 476000,
        "reward_mean": 0.022400000000000298,
        "reward_max": 0.9880000000000004,
        "reward_min": -0.9889999999999999,
        "leartime_s": 0.03905114298686385,
        "sampletime": 2.0565972230106127,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 478000,
        "reward_mean": -0.19169999999999976,
        "reward_max": 0.9159375000000006,
        "reward_min": -1.407125,
        "leartime_s": 0.013409910985501483,
        "sampletime": 2.030493378988467,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 480000,
        "reward_mean": -0.07559999999999974,
        "reward_max": 1.0037500000000001,
        "reward_min": -1.0329375,
        "leartime_s": 0.02350782899884507,
        "sampletime": 2.210173906001728,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 482000,
        "reward_mean": -0.08239999999999978,
        "reward_max": 0.8123125000000005,
        "reward_min": -1.2769375000000003,
        "leartime_s": 0.030527235998306423,
        "sampletime": 1.7139774019888137,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 484000,
        "reward_mean": -0.41964999999999975,
        "reward_max": 0.6273750000000008,
        "reward_min": -1.633,
        "leartime_s": 0.026443192997248843,
        "sampletime": 2.1265389930049423,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 486000,
        "reward_mean": -0.36049999999999977,
        "reward_max": 0.6234375000000003,
        "reward_min": -1.7915,
        "leartime_s": 0.029317896987777203,
        "sampletime": 2.047018642013427,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 488000,
        "reward_mean": -0.2828249999999997,
        "reward_max": 0.7499375000000005,
        "reward_min": -1.7171875000000003,
        "leartime_s": 0.06811466699582525,
        "sampletime": 1.804223371000262,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 490000,
        "reward_mean": -0.28249999999999975,
        "reward_max": 0.8757500000000005,
        "reward_min": -1.3156250000000003,
        "leartime_s": 0.021054753015050665,
        "sampletime": 1.9444959779793862,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 492000,
        "reward_mean": -0.2829499999999998,
        "reward_max": 0.5343750000000005,
        "reward_min": -1.4546875,
        "leartime_s": 0.030667968007037416,
        "sampletime": 2.2481108400097582,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 494000,
        "reward_mean": -0.1136999999999997,
        "reward_max": 0.8456875000000006,
        "reward_min": -1.5860000000000003,
        "leartime_s": 0.02271757400012575,
        "sampletime": 1.867770314012887,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 496000,
        "reward_mean": -0.18212499999999976,
        "reward_max": 0.7821250000000002,
        "reward_min": -1.4123125,
        "leartime_s": 0.03685233599389903,
        "sampletime": 2.151203657995211,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 498000,
        "reward_mean": -0.4636249999999998,
        "reward_max": 0.6549375000000004,
        "reward_min": -1.5719375,
        "leartime_s": 0.033847020007669926,
        "sampletime": 1.639953317004256,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 500000,
        "reward_mean": -0.15714999999999976,
        "reward_max": 0.7550000000000006,
        "reward_min": -1.4278125,
        "leartime_s": 0.05046339600812644,
        "sampletime": 1.9037638290028553,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 502000,
        "reward_mean": -0.007999999999999691,
        "reward_max": 0.9633750000000008,
        "reward_min": -1.5444375,
        "leartime_s": 0.06265190200065263,
        "sampletime": 1.883927245013183,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 504000,
        "reward_mean": -0.19137499999999968,
        "reward_max": 0.8762500000000005,
        "reward_min": -1.6941875000000002,
        "leartime_s": 0.04290570400189608,
        "sampletime": 2.100075594004011,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 506000,
        "reward_mean": -0.18059999999999973,
        "reward_max": 0.8036875000000006,
        "reward_min": -1.4974999999999998,
        "leartime_s": 0.03860581899061799,
        "sampletime": 2.111846704996424,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 508000,
        "reward_mean": -0.35674999999999973,
        "reward_max": 0.6260000000000006,
        "reward_min": -1.8193124999999999,
        "leartime_s": 0.02607886999612674,
        "sampletime": 1.953843227995094,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 510000,
        "reward_mean": -0.0713249999999997,
        "reward_max": 0.8282500000000007,
        "reward_min": -1.0940625,
        "leartime_s": 0.014473438001004979,
        "sampletime": 2.0415821310016327,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 512000,
        "reward_mean": -0.20819999999999977,
        "reward_max": 0.7642500000000002,
        "reward_min": -1.4977500000000001,
        "leartime_s": 0.06729783199261874,
        "sampletime": 2.1203483220015187,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 514000,
        "reward_mean": -0.27569999999999983,
        "reward_max": 0.6747500000000004,
        "reward_min": -1.4155625000000003,
        "leartime_s": 0.030782496003666893,
        "sampletime": 2.002252670004964,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 516000,
        "reward_mean": -0.33682499999999976,
        "reward_max": 0.7686875000000007,
        "reward_min": -1.436375,
        "leartime_s": 0.0715618149843067,
        "sampletime": 2.106105854996713,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 518000,
        "reward_mean": -0.31109999999999977,
        "reward_max": 0.5881250000000005,
        "reward_min": -1.6726875000000005,
        "leartime_s": 0.01441102399257943,
        "sampletime": 1.9629975389980245,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 520000,
        "reward_mean": -0.29067499999999974,
        "reward_max": 0.6486875000000006,
        "reward_min": -1.5981250000000002,
        "leartime_s": 0.09237326300353743,
        "sampletime": 2.1353956689999904,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 522000,
        "reward_mean": -0.1998999999999997,
        "reward_max": 0.7267500000000007,
        "reward_min": -1.3883750000000001,
        "leartime_s": 0.043009187997085974,
        "sampletime": 2.092595153982984,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 524000,
        "reward_mean": -0.24267499999999975,
        "reward_max": 0.5967500000000002,
        "reward_min": -1.2306875000000004,
        "leartime_s": 0.05502246200921945,
        "sampletime": 1.8336327620199881,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 526000,
        "reward_mean": -0.2444749999999998,
        "reward_max": 0.9622500000000004,
        "reward_min": -1.5549375,
        "leartime_s": 0.05865665097371675,
        "sampletime": 1.919201245997101,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 528000,
        "reward_mean": -0.0603749999999997,
        "reward_max": 0.8580000000000005,
        "reward_min": -1.3966250000000004,
        "leartime_s": 0.056684764014789835,
        "sampletime": 1.966393564012833,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 530000,
        "reward_mean": -0.36062499999999975,
        "reward_max": 0.6661875000000004,
        "reward_min": -1.9595625,
        "leartime_s": 0.024038203002419323,
        "sampletime": 1.7093591350130737,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 532000,
        "reward_mean": -0.2504499999999998,
        "reward_max": 0.7035000000000005,
        "reward_min": -1.4053124999999997,
        "leartime_s": 0.04175916500389576,
        "sampletime": 1.696408239979064,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 534000,
        "reward_mean": -0.20164999999999975,
        "reward_max": 0.8602500000000004,
        "reward_min": -1.4290000000000003,
        "leartime_s": 0.029470148001564667,
        "sampletime": 2.356324185995618,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 536000,
        "reward_mean": -0.2817749999999998,
        "reward_max": 0.6155625000000006,
        "reward_min": -1.6572500000000003,
        "leartime_s": 0.030551293020835146,
        "sampletime": 1.6754253670223989,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 538000,
        "reward_mean": -0.09587499999999967,
        "reward_max": 0.6303750000000001,
        "reward_min": -1.5454375,
        "leartime_s": 0.017050616996129975,
        "sampletime": 2.270963875023881,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 540000,
        "reward_mean": -0.39982499999999976,
        "reward_max": 0.5683750000000005,
        "reward_min": -1.5059375000000004,
        "leartime_s": 0.031318491004640236,
        "sampletime": 1.9837500659923535,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 542000,
        "reward_mean": -0.4210749999999998,
        "reward_max": 0.6125625000000007,
        "reward_min": -1.7070625,
        "leartime_s": 0.02324542700080201,
        "sampletime": 2.1226675669895485,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 544000,
        "reward_mean": -0.30629999999999974,
        "reward_max": 0.4903125000000006,
        "reward_min": -1.3003749999999998,
        "leartime_s": 0.01860263099661097,
        "sampletime": 2.0832629400247242,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 546000,
        "reward_mean": -0.3331499999999999,
        "reward_max": 0.6621250000000003,
        "reward_min": -1.4152499999999997,
        "leartime_s": 0.07633012998849154,
        "sampletime": 1.7783759919984732,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 548000,
        "reward_mean": -0.2707999999999998,
        "reward_max": 0.7771875000000004,
        "reward_min": -1.2699375,
        "leartime_s": 0.019165952980984002,
        "sampletime": 2.0803217489738017,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 550000,
        "reward_mean": -0.2499999999999998,
        "reward_max": 0.6147500000000005,
        "reward_min": -1.7020624999999996,
        "leartime_s": 0.03300356701947749,
        "sampletime": 2.0316115180030465,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 552000,
        "reward_mean": -0.21654999999999977,
        "reward_max": 0.6000000000000006,
        "reward_min": -1.2211875,
        "leartime_s": 0.01791507299640216,
        "sampletime": 1.9326905909983907,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 554000,
        "reward_mean": -0.23522499999999974,
        "reward_max": 0.5675625000000004,
        "reward_min": -1.3430625,
        "leartime_s": 0.018327016005059704,
        "sampletime": 1.9053246999974363,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 556000,
        "reward_mean": -0.08407499999999973,
        "reward_max": 0.9285000000000003,
        "reward_min": -1.2516250000000004,
        "leartime_s": 0.033177195000462234,
        "sampletime": 1.815136706980411,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 558000,
        "reward_mean": -0.48119999999999974,
        "reward_max": 0.4988750000000001,
        "reward_min": -1.6486250000000002,
        "leartime_s": 0.026348568993853405,
        "sampletime": 1.8507947490143124,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 560000,
        "reward_mean": -0.3293249999999997,
        "reward_max": 0.5248125000000006,
        "reward_min": -1.5231875000000004,
        "leartime_s": 0.04955019601038657,
        "sampletime": 1.833443166979123,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 562000,
        "reward_mean": -0.09007499999999972,
        "reward_max": 0.7766875000000006,
        "reward_min": -1.3270625000000005,
        "leartime_s": 0.0680228260171134,
        "sampletime": 1.9170848039793782,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 564000,
        "reward_mean": -0.09232499999999973,
        "reward_max": 0.9955625000000005,
        "reward_min": -1.3569375000000004,
        "leartime_s": 0.057820262998575345,
        "sampletime": 1.7137933259946294,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 566000,
        "reward_mean": -0.49819999999999987,
        "reward_max": 0.7736250000000002,
        "reward_min": -1.4551875,
        "leartime_s": 0.04805461398791522,
        "sampletime": 1.8279219059913885,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 568000,
        "reward_mean": -0.2337749999999997,
        "reward_max": 0.8155625000000005,
        "reward_min": -1.4140625000000002,
        "leartime_s": 0.08691414800705388,
        "sampletime": 1.867387239006348,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 570000,
        "reward_mean": -0.10332499999999974,
        "reward_max": 0.9810625000000002,
        "reward_min": -1.623625,
        "leartime_s": 0.029935178987216204,
        "sampletime": 2.0024132579856087,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 572000,
        "reward_mean": -0.05817499999999977,
        "reward_max": 0.9030625000000005,
        "reward_min": -1.5593125,
        "leartime_s": 0.028708480997011065,
        "sampletime": 1.7818957600102294,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 574000,
        "reward_mean": -0.0715999999999998,
        "reward_max": 0.9523125000000002,
        "reward_min": -1.2687499999999998,
        "leartime_s": 0.11903820300358348,
        "sampletime": 1.7808849510038272,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 576000,
        "reward_mean": -0.1482999999999998,
        "reward_max": 0.9867500000000003,
        "reward_min": -1.1207500000000001,
        "leartime_s": 0.07054784701904282,
        "sampletime": 2.366146510001272,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 578000,
        "reward_mean": -0.17127499999999982,
        "reward_max": 0.9667500000000001,
        "reward_min": -1.6055625000000002,
        "leartime_s": 0.033646970987319946,
        "sampletime": 2.004677115008235,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 580000,
        "reward_mean": -0.1871749999999997,
        "reward_max": 0.8921875000000005,
        "reward_min": -1.7848125000000006,
        "leartime_s": 0.0621795579791069,
        "sampletime": 2.0612970780057367,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 582000,
        "reward_mean": -0.06109999999999973,
        "reward_max": 1.1477500000000005,
        "reward_min": -1.022625,
        "leartime_s": 0.055681915022432804,
        "sampletime": 2.1753203739936,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 584000,
        "reward_mean": -0.2209499999999998,
        "reward_max": 0.9113750000000002,
        "reward_min": -1.3169374999999997,
        "leartime_s": 0.05547407499398105,
        "sampletime": 1.784809723001672,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 586000,
        "reward_mean": -0.17189999999999972,
        "reward_max": 0.7508750000000001,
        "reward_min": -1.7126875,
        "leartime_s": 0.03959228700841777,
        "sampletime": 1.8890822120010853,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 588000,
        "reward_mean": 0.039925000000000335,
        "reward_max": 0.8423125000000005,
        "reward_min": -0.8643750000000001,
        "leartime_s": 0.020012220018543303,
        "sampletime": 1.9350926199986134,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 590000,
        "reward_mean": -0.15589999999999982,
        "reward_max": 0.7433750000000005,
        "reward_min": -1.5431249999999996,
        "leartime_s": 0.01051332100178115,
        "sampletime": 1.769084172003204,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 592000,
        "reward_mean": -0.19577499999999973,
        "reward_max": 0.6118125000000005,
        "reward_min": -1.4768749999999997,
        "leartime_s": 0.02886614899034612,
        "sampletime": 2.1389904220122844,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 594000,
        "reward_mean": -0.24052499999999974,
        "reward_max": 0.8587500000000003,
        "reward_min": -1.4242500000000005,
        "leartime_s": 0.021196790010435507,
        "sampletime": 2.0698120400193147,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 596000,
        "reward_mean": -0.16439999999999969,
        "reward_max": 0.9436875000000007,
        "reward_min": -1.1795624999999998,
        "leartime_s": 0.06225521699525416,
        "sampletime": 1.9354076529853046,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 598000,
        "reward_mean": -0.34224999999999967,
        "reward_max": 0.5896250000000003,
        "reward_min": -1.7983749999999996,
        "leartime_s": 0.05782208201708272,
        "sampletime": 1.7094177549879532,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 600000,
        "reward_mean": -0.19507499999999978,
        "reward_max": 0.7836875000000005,
        "reward_min": -1.3464375,
        "leartime_s": 0.0289650890044868,
        "sampletime": 1.9548863020027056,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 602000,
        "reward_mean": -0.03379999999999979,
        "reward_max": 1.0991250000000004,
        "reward_min": -1.7473750000000001,
        "leartime_s": 0.06645637398469262,
        "sampletime": 1.766627906006761,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 604000,
        "reward_mean": -0.23522499999999974,
        "reward_max": 0.7708125000000005,
        "reward_min": -1.5303125,
        "leartime_s": 0.0874255690141581,
        "sampletime": 2.5498208290082403,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 606000,
        "reward_mean": -0.4287999999999998,
        "reward_max": 0.42156250000000045,
        "reward_min": -1.6683124999999999,
        "leartime_s": 0.02178052402450703,
        "sampletime": 1.7085824800014962,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 608000,
        "reward_mean": -0.28314999999999974,
        "reward_max": 0.8217500000000006,
        "reward_min": -1.825625,
        "leartime_s": 0.09356418601237237,
        "sampletime": 2.1103989749972243,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 610000,
        "reward_mean": 0.014350000000000227,
        "reward_max": 1.1779375000000005,
        "reward_min": -1.4266874999999999,
        "leartime_s": 0.02841012700810097,
        "sampletime": 1.9955049160053022,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 612000,
        "reward_mean": -0.4001999999999997,
        "reward_max": 0.9403750000000005,
        "reward_min": -2.01775,
        "leartime_s": 0.06941401399672031,
        "sampletime": 1.752349084999878,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 614000,
        "reward_mean": -0.31739999999999985,
        "reward_max": 0.7710625000000003,
        "reward_min": -1.3168125,
        "leartime_s": 0.03393212900846265,
        "sampletime": 2.0439278970006853,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 616000,
        "reward_mean": -0.5667749999999999,
        "reward_max": 0.47137500000000043,
        "reward_min": -1.9569999999999999,
        "leartime_s": 0.05243914798484184,
        "sampletime": 2.127030620991718,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 618000,
        "reward_mean": -0.3417749999999998,
        "reward_max": 0.6713750000000005,
        "reward_min": -1.4135624999999998,
        "leartime_s": 0.08190312099759467,
        "sampletime": 1.8327434899983928,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 620000,
        "reward_mean": -0.39374999999999977,
        "reward_max": 0.5323750000000005,
        "reward_min": -1.614,
        "leartime_s": 0.07311514200409874,
        "sampletime": 1.6419197139912285,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 622000,
        "reward_mean": -0.3150499999999997,
        "reward_max": 0.8339375000000007,
        "reward_min": -1.6338125000000003,
        "leartime_s": 0.07184457301627845,
        "sampletime": 2.0407739040092565,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 624000,
        "reward_mean": -0.5130499999999999,
        "reward_max": 0.4945000000000005,
        "reward_min": -1.7159375,
        "leartime_s": 0.04683402299997397,
        "sampletime": 2.0206277430115733,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 626000,
        "reward_mean": -0.23764999999999975,
        "reward_max": 0.7693125000000002,
        "reward_min": -1.751875,
        "leartime_s": 0.04047721001552418,
        "sampletime": 1.980227239022497,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 628000,
        "reward_mean": -0.3271249999999998,
        "reward_max": 0.7305625000000003,
        "reward_min": -1.8353125000000001,
        "leartime_s": 0.042053582990774885,
        "sampletime": 2.1260799059818964,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 630000,
        "reward_mean": -0.27764999999999973,
        "reward_max": 0.6283125000000005,
        "reward_min": -1.451,
        "leartime_s": 0.031958517007296905,
        "sampletime": 1.6914889710024,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 632000,
        "reward_mean": -0.22204999999999972,
        "reward_max": 0.7718750000000005,
        "reward_min": -1.3981875000000004,
        "leartime_s": 0.026719202025560662,
        "sampletime": 1.7118022989889141,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 634000,
        "reward_mean": -0.3693499999999998,
        "reward_max": 0.5437500000000005,
        "reward_min": -1.5121249999999997,
        "leartime_s": 0.04362156899878755,
        "sampletime": 1.9894468419952318,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 636000,
        "reward_mean": -0.35317499999999985,
        "reward_max": 0.6329375000000003,
        "reward_min": -1.4852500000000006,
        "leartime_s": 0.04596039600437507,
        "sampletime": 1.8348954989924096,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 638000,
        "reward_mean": -0.20867499999999972,
        "reward_max": 1.0358125000000007,
        "reward_min": -2.2080624999999996,
        "leartime_s": 0.07346217500162311,
        "sampletime": 1.8371630239998922,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 640000,
        "reward_mean": -0.31602499999999983,
        "reward_max": 0.7761875000000005,
        "reward_min": -1.332125,
        "leartime_s": 0.054199172009248286,
        "sampletime": 2.0658681930217426,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 642000,
        "reward_mean": -0.3593749999999998,
        "reward_max": 0.7631250000000005,
        "reward_min": -1.3881875000000001,
        "leartime_s": 0.04270295999594964,
        "sampletime": 2.0191180979891215,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 644000,
        "reward_mean": -0.23102499999999973,
        "reward_max": 0.7148750000000005,
        "reward_min": -1.5621874999999998,
        "leartime_s": 0.02908180298982188,
        "sampletime": 1.8681332539999858,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 646000,
        "reward_mean": -0.2599999999999998,
        "reward_max": 0.9141875000000005,
        "reward_min": -1.6946250000000003,
        "leartime_s": 0.0369803860085085,
        "sampletime": 2.2920361470023636,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 648000,
        "reward_mean": -0.05627499999999971,
        "reward_max": 1.0540625000000006,
        "reward_min": -1.3946250000000002,
        "leartime_s": 0.03980800500721671,
        "sampletime": 2.1257522720261477,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 650000,
        "reward_mean": -0.16764999999999974,
        "reward_max": 0.7662500000000004,
        "reward_min": -1.1825625,
        "leartime_s": 0.025196911010425538,
        "sampletime": 1.8670121089962777,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 652000,
        "reward_mean": -0.21057499999999985,
        "reward_max": 0.7805000000000005,
        "reward_min": -1.5728125000000004,
        "leartime_s": 0.04753180898842402,
        "sampletime": 1.9486389469821006,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 654000,
        "reward_mean": -0.4295249999999998,
        "reward_max": 0.5317500000000004,
        "reward_min": -1.5184375000000003,
        "leartime_s": 0.03840515500633046,
        "sampletime": 2.0729190639976878,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 656000,
        "reward_mean": -0.4007249999999998,
        "reward_max": 0.5785625000000004,
        "reward_min": -1.4205625,
        "leartime_s": 0.04595348599832505,
        "sampletime": 1.766937838983722,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 658000,
        "reward_mean": -0.22374999999999973,
        "reward_max": 0.9636250000000001,
        "reward_min": -1.3898124999999997,
        "leartime_s": 0.07109979700180702,
        "sampletime": 2.174032680981327,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 660000,
        "reward_mean": -0.4644749999999998,
        "reward_max": 0.6983125000000006,
        "reward_min": -1.6944375,
        "leartime_s": 0.02336225801263936,
        "sampletime": 2.023204339988297,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 662000,
        "reward_mean": -0.44902499999999973,
        "reward_max": 0.39262500000000045,
        "reward_min": -1.6258749999999997,
        "leartime_s": 0.03997184897889383,
        "sampletime": 1.7188827580248471,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 664000,
        "reward_mean": -0.30004999999999976,
        "reward_max": 0.6016250000000003,
        "reward_min": -1.5421875000000005,
        "leartime_s": 0.06594818600569852,
        "sampletime": 1.6016790159919765,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 666000,
        "reward_mean": -0.35427499999999973,
        "reward_max": 0.6781875000000004,
        "reward_min": -1.8541250000000002,
        "leartime_s": 0.03643305899458937,
        "sampletime": 2.0137403109984007,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 668000,
        "reward_mean": -0.6317499999999998,
        "reward_max": 0.5443750000000007,
        "reward_min": -2.060375,
        "leartime_s": 0.05366302700713277,
        "sampletime": 1.9504602959787007,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 670000,
        "reward_mean": -0.3840999999999997,
        "reward_max": 0.7185625000000005,
        "reward_min": -1.7019375,
        "leartime_s": 0.07273158800671808,
        "sampletime": 2.1548480009951163,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 672000,
        "reward_mean": -0.29667499999999974,
        "reward_max": 0.6298125000000009,
        "reward_min": -1.4064999999999999,
        "leartime_s": 0.024005709012271836,
        "sampletime": 1.9107715370191727,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 674000,
        "reward_mean": -0.4565999999999998,
        "reward_max": 0.5030625000000005,
        "reward_min": -1.76875,
        "leartime_s": 0.09785033800289966,
        "sampletime": 1.7672802430170123,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 676000,
        "reward_mean": -0.24919999999999976,
        "reward_max": 0.7259375000000006,
        "reward_min": -1.77625,
        "leartime_s": 0.033184113999595866,
        "sampletime": 2.0044592379999813,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 678000,
        "reward_mean": -0.3425249999999998,
        "reward_max": 0.8255000000000002,
        "reward_min": -1.4285625,
        "leartime_s": 0.026242446998367086,
        "sampletime": 1.9493603169976268,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 680000,
        "reward_mean": -0.3335999999999998,
        "reward_max": 0.5640000000000003,
        "reward_min": -1.8591250000000006,
        "leartime_s": 0.04149781001615338,
        "sampletime": 1.784916220989544,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 682000,
        "reward_mean": -0.39077499999999976,
        "reward_max": 0.5925625000000007,
        "reward_min": -1.4878125,
        "leartime_s": 0.02832741499878466,
        "sampletime": 1.8599732239963487,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 684000,
        "reward_mean": -0.4962499999999999,
        "reward_max": 0.7470625000000004,
        "reward_min": -1.7126875000000001,
        "leartime_s": 0.04313802099204622,
        "sampletime": 2.001467846974265,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 686000,
        "reward_mean": -0.5116999999999998,
        "reward_max": 0.3285000000000006,
        "reward_min": -1.6993125000000002,
        "leartime_s": 0.024134900973876938,
        "sampletime": 1.923823627003003,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 688000,
        "reward_mean": -0.37992499999999985,
        "reward_max": 0.5273125000000007,
        "reward_min": -1.6557500000000007,
        "leartime_s": 0.027211326989345253,
        "sampletime": 1.6898003569804132,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 690000,
        "reward_mean": -0.5033249999999998,
        "reward_max": 0.5941875000000006,
        "reward_min": -2.0106250000000006,
        "leartime_s": 0.041818530997261405,
        "sampletime": 2.0802911359933205,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 692000,
        "reward_mean": -0.6888999999999998,
        "reward_max": 0.33175000000000043,
        "reward_min": -2.2646250000000006,
        "leartime_s": 0.035855455993441865,
        "sampletime": 2.1511817360005807,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 694000,
        "reward_mean": -0.4411999999999998,
        "reward_max": 0.3725625000000007,
        "reward_min": -1.4668750000000004,
        "leartime_s": 0.05754887600778602,
        "sampletime": 1.7557881649991032,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 696000,
        "reward_mean": -0.29359999999999986,
        "reward_max": 0.5680000000000005,
        "reward_min": -1.4712499999999997,
        "leartime_s": 0.04964870502590202,
        "sampletime": 1.6755918489943724,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 698000,
        "reward_mean": -0.5018249999999999,
        "reward_max": 0.4887500000000004,
        "reward_min": -1.5803750000000003,
        "leartime_s": 0.06207861201255582,
        "sampletime": 2.1624008800135925,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 700000,
        "reward_mean": -0.5181499999999998,
        "reward_max": 0.5221250000000002,
        "reward_min": -2.1122500000000004,
        "leartime_s": 0.027551967999897897,
        "sampletime": 1.7056919739989098,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 702000,
        "reward_mean": -0.45762499999999984,
        "reward_max": 0.5640625000000004,
        "reward_min": -1.4786875000000002,
        "leartime_s": 0.040184618992498145,
        "sampletime": 2.082832944986876,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 704000,
        "reward_mean": -0.2958499999999997,
        "reward_max": 0.6894375000000004,
        "reward_min": -1.398875,
        "leartime_s": 0.06222742301179096,
        "sampletime": 2.1017462190066,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 706000,
        "reward_mean": -0.49982499999999985,
        "reward_max": 0.6373125000000006,
        "reward_min": -1.4993750000000001,
        "leartime_s": 0.034421104995999485,
        "sampletime": 1.6510271469887812,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 708000,
        "reward_mean": -0.5213499999999999,
        "reward_max": 0.4463750000000005,
        "reward_min": -1.7175624999999999,
        "leartime_s": 0.033863378019304946,
        "sampletime": 2.1100692139880266,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 710000,
        "reward_mean": -0.6100249999999998,
        "reward_max": 0.32037500000000063,
        "reward_min": -2.236125,
        "leartime_s": 0.02915345100336708,
        "sampletime": 1.9777049920230638,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 712000,
        "reward_mean": -0.6132499999999999,
        "reward_max": 0.3886250000000002,
        "reward_min": -1.7329375000000005,
        "leartime_s": 0.07296749099623412,
        "sampletime": 1.771127258980414,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 714000,
        "reward_mean": -0.6805999999999998,
        "reward_max": 0.16300000000000042,
        "reward_min": -1.91325,
        "leartime_s": 0.0624495759839192,
        "sampletime": 2.0504597469989676,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 716000,
        "reward_mean": -0.54585,
        "reward_max": 0.46362500000000034,
        "reward_min": -1.5243750000000005,
        "leartime_s": 0.032059402990853414,
        "sampletime": 2.18900852301158,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 718000,
        "reward_mean": -0.32427499999999987,
        "reward_max": 0.6491875000000005,
        "reward_min": -1.5609375000000003,
        "leartime_s": 0.02845849600271322,
        "sampletime": 1.7244259160070214,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 720000,
        "reward_mean": -0.6523999999999999,
        "reward_max": 0.5483750000000005,
        "reward_min": -2.1788125000000007,
        "leartime_s": 0.04215761597151868,
        "sampletime": 1.983989543019561,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 722000,
        "reward_mean": -0.4522249999999999,
        "reward_max": 0.5608125000000007,
        "reward_min": -1.5333125,
        "leartime_s": 0.04768946999683976,
        "sampletime": 2.0067815990187228,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 724000,
        "reward_mean": -0.6788,
        "reward_max": 0.3100625000000005,
        "reward_min": -1.9348750000000006,
        "leartime_s": 0.058975177991669625,
        "sampletime": 1.8354895840166137,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 726000,
        "reward_mean": -0.42332499999999995,
        "reward_max": 0.4220000000000003,
        "reward_min": -1.4461875,
        "leartime_s": 0.03243065602146089,
        "sampletime": 2.390089765016455,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 728000,
        "reward_mean": -0.7551749999999999,
        "reward_max": 0.1383125000000002,
        "reward_min": -1.9976250000000002,
        "leartime_s": 0.0369253620156087,
        "sampletime": 1.7126702459936496,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 730000,
        "reward_mean": -0.780925,
        "reward_max": 0.4013125000000003,
        "reward_min": -1.8545000000000003,
        "leartime_s": 0.03145252901595086,
        "sampletime": 1.6460938390227966,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 732000,
        "reward_mean": -0.7860999999999999,
        "reward_max": 0.0748750000000005,
        "reward_min": -2.2498124999999995,
        "leartime_s": 0.03649973901337944,
        "sampletime": 2.1433785150002223,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 734000,
        "reward_mean": -0.7746999999999999,
        "reward_max": 0.33706250000000043,
        "reward_min": -2.3670625000000007,
        "leartime_s": 0.04621212399797514,
        "sampletime": 1.8172432710125577,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 736000,
        "reward_mean": -0.6799499999999998,
        "reward_max": 0.6846250000000004,
        "reward_min": -1.9915000000000005,
        "leartime_s": 0.09738046099664643,
        "sampletime": 2.214263413014123,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 738000,
        "reward_mean": -0.742675,
        "reward_max": 0.32268750000000046,
        "reward_min": -2.5963125000000007,
        "leartime_s": 0.04243949698866345,
        "sampletime": 2.193212793004932,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 740000,
        "reward_mean": -0.5079249999999998,
        "reward_max": 0.45343750000000027,
        "reward_min": -1.8221875000000003,
        "leartime_s": 0.08396367297973484,
        "sampletime": 2.1182062980078626,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 742000,
        "reward_mean": -0.5627499999999998,
        "reward_max": 0.5061250000000004,
        "reward_min": -1.9676250000000004,
        "leartime_s": 0.021412679023342207,
        "sampletime": 2.1384928670013323,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 744000,
        "reward_mean": -0.8221749999999999,
        "reward_max": 0.3734375000000005,
        "reward_min": -2.0262499999999997,
        "leartime_s": 0.04291222000028938,
        "sampletime": 1.6926301129860803,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 746000,
        "reward_mean": -0.5838749999999999,
        "reward_max": 0.41031250000000047,
        "reward_min": -1.9330625000000006,
        "leartime_s": 0.075695501989685,
        "sampletime": 2.236526986991521,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 748000,
        "reward_mean": -0.42494999999999994,
        "reward_max": 0.3934375000000003,
        "reward_min": -1.6193125000000004,
        "leartime_s": 0.06821053999010473,
        "sampletime": 1.7957920979824848,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 750000,
        "reward_mean": -0.7607499999999998,
        "reward_max": 0.1811250000000006,
        "reward_min": -1.944,
        "leartime_s": 0.052930531004676595,
        "sampletime": 1.7446247409970965,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 752000,
        "reward_mean": -0.7107749999999998,
        "reward_max": 0.27487500000000054,
        "reward_min": -1.7761875000000003,
        "leartime_s": 0.04312562997802161,
        "sampletime": 2.27485398601857,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 754000,
        "reward_mean": -0.5567249999999999,
        "reward_max": 0.37212500000000026,
        "reward_min": -1.7828125000000004,
        "leartime_s": 0.0434805839904584,
        "sampletime": 1.7641101640183479,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 756000,
        "reward_mean": -0.799825,
        "reward_max": 0.2587500000000006,
        "reward_min": -2.0145,
        "leartime_s": 0.06311228702543303,
        "sampletime": 2.0482481999788433,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 758000,
        "reward_mean": -0.5837249999999999,
        "reward_max": 0.6396250000000002,
        "reward_min": -1.7573125000000003,
        "leartime_s": 0.038202091003768146,
        "sampletime": 2.182864514994435,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 760000,
        "reward_mean": -0.7397249999999999,
        "reward_max": 0.2601875000000005,
        "reward_min": -2.0924375,
        "leartime_s": 0.0822834600112401,
        "sampletime": 1.8694674719881732,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 762000,
        "reward_mean": -0.6624749999999999,
        "reward_max": 0.47356250000000044,
        "reward_min": -2.312125,
        "leartime_s": 0.05975964100798592,
        "sampletime": 1.9729062689875718,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 764000,
        "reward_mean": -0.41739999999999994,
        "reward_max": 0.5595000000000006,
        "reward_min": -1.70075,
        "leartime_s": 0.04370457399636507,
        "sampletime": 1.6913522339891642,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 766000,
        "reward_mean": -0.92535,
        "reward_max": 0.06331250000000029,
        "reward_min": -2.0028125000000006,
        "leartime_s": 0.023121500009438023,
        "sampletime": 2.072689065011218,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 768000,
        "reward_mean": -0.7994499999999999,
        "reward_max": 0.3821250000000004,
        "reward_min": -1.9735625000000006,
        "leartime_s": 0.041608519008150324,
        "sampletime": 1.7991849410173018,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 770000,
        "reward_mean": -0.6554249999999998,
        "reward_max": 0.4946250000000003,
        "reward_min": -1.8825625000000004,
        "leartime_s": 0.027200884011108428,
        "sampletime": 1.770662992988946,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 772000,
        "reward_mean": -0.6589749999999999,
        "reward_max": 0.42662500000000064,
        "reward_min": -1.9418125000000002,
        "leartime_s": 0.04618385498179123,
        "sampletime": 2.242565429973183,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 774000,
        "reward_mean": -0.618425,
        "reward_max": 0.3939375000000004,
        "reward_min": -1.9719375000000006,
        "leartime_s": 0.059518553025554866,
        "sampletime": 1.746547507995274,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 776000,
        "reward_mean": -0.7412249999999999,
        "reward_max": 0.22406250000000028,
        "reward_min": -2.1692499999999995,
        "leartime_s": 0.07477428097627126,
        "sampletime": 1.8370634560124017,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 778000,
        "reward_mean": -0.70675,
        "reward_max": 0.1816250000000004,
        "reward_min": -2.3618125,
        "leartime_s": 0.054789281013654545,
        "sampletime": 2.17509680299554,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 780000,
        "reward_mean": -0.62315,
        "reward_max": 0.4905000000000005,
        "reward_min": -1.957,
        "leartime_s": 0.06594541200320236,
        "sampletime": 1.863696490006987,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 782000,
        "reward_mean": -0.4533,
        "reward_max": 0.6225625000000004,
        "reward_min": -1.7936875000000008,
        "leartime_s": 0.061276986001757905,
        "sampletime": 1.9931199899874628,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 784000,
        "reward_mean": -0.71865,
        "reward_max": 0.07412500000000025,
        "reward_min": -1.9640625,
        "leartime_s": 0.04181742001674138,
        "sampletime": 2.04696074599633,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 786000,
        "reward_mean": -0.6726499999999999,
        "reward_max": 0.2733125000000005,
        "reward_min": -1.9450625000000004,
        "leartime_s": 0.05622871400555596,
        "sampletime": 1.6993113569915295,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 788000,
        "reward_mean": -0.5630499999999999,
        "reward_max": 0.4245625000000003,
        "reward_min": -1.5738750000000001,
        "leartime_s": 0.07568630800233223,
        "sampletime": 2.0523308659903705,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 790000,
        "reward_mean": -0.29959999999999987,
        "reward_max": 0.6318125000000002,
        "reward_min": -1.3816250000000003,
        "leartime_s": 0.030851693998556584,
        "sampletime": 2.155525295995176,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 792000,
        "reward_mean": -0.40969999999999984,
        "reward_max": 0.5146875000000005,
        "reward_min": -1.7230625000000002,
        "leartime_s": 0.05073153099510819,
        "sampletime": 1.70526675999281,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 794000,
        "reward_mean": -0.3782499999999998,
        "reward_max": 0.5158125000000005,
        "reward_min": -1.597625,
        "leartime_s": 0.029428332985844463,
        "sampletime": 2.0961166660126764,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 796000,
        "reward_mean": -0.7975,
        "reward_max": 0.48893750000000047,
        "reward_min": -2.1553125000000004,
        "leartime_s": 0.056276332994457334,
        "sampletime": 1.6935608070052695,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 798000,
        "reward_mean": -0.33282499999999987,
        "reward_max": 0.9616875000000004,
        "reward_min": -1.6112500000000003,
        "leartime_s": 0.0632262279978022,
        "sampletime": 1.608927126013441,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 800000,
        "reward_mean": -0.617375,
        "reward_max": 0.0704375000000004,
        "reward_min": -1.7113125000000007,
        "leartime_s": 0.054276471986668184,
        "sampletime": 2.0905452230072115,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 802000,
        "reward_mean": -0.790075,
        "reward_max": 0.20012500000000044,
        "reward_min": -2.058625,
        "leartime_s": 0.033756597986212,
        "sampletime": 2.0416125979973003,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 804000,
        "reward_mean": -0.5380999999999999,
        "reward_max": 0.5096875000000004,
        "reward_min": -1.8223750000000005,
        "leartime_s": 0.08152020402485505,
        "sampletime": 1.902423469000496,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 806000,
        "reward_mean": -0.5326999999999998,
        "reward_max": 0.5815625000000004,
        "reward_min": -1.5099374999999997,
        "leartime_s": 0.03879045500070788,
        "sampletime": 2.0412591960048303,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 808000,
        "reward_mean": -0.8153999999999999,
        "reward_max": 0.07131250000000035,
        "reward_min": -2.3953750000000005,
        "leartime_s": 0.055500935995951295,
        "sampletime": 1.8888552479911596,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 810000,
        "reward_mean": -0.6050999999999999,
        "reward_max": 0.3308750000000003,
        "reward_min": -1.9598125,
        "leartime_s": 0.016533102985704318,
        "sampletime": 1.7510476490133442,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 812000,
        "reward_mean": -0.5738749999999998,
        "reward_max": 0.4951875000000003,
        "reward_min": -2.0923750000000005,
        "leartime_s": 0.057155201997375116,
        "sampletime": 2.0598371220112313,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 814000,
        "reward_mean": -0.8495499999999999,
        "reward_max": 0.019000000000000322,
        "reward_min": -1.9171875000000003,
        "leartime_s": 0.020309892017394304,
        "sampletime": 1.9963578229944687,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 816000,
        "reward_mean": -0.7075750000000001,
        "reward_max": 0.3232500000000004,
        "reward_min": -1.79725,
        "leartime_s": 0.0428264880029019,
        "sampletime": 1.7158422580105253,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 818000,
        "reward_mean": -0.38352499999999984,
        "reward_max": 0.7353750000000004,
        "reward_min": -1.5371875000000004,
        "leartime_s": 0.022466394992079586,
        "sampletime": 2.109239671000978,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 820000,
        "reward_mean": -0.5590249999999999,
        "reward_max": 0.4280000000000004,
        "reward_min": -2.074625,
        "leartime_s": 0.04581438101013191,
        "sampletime": 1.8304280689917505,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 822000,
        "reward_mean": -0.36814999999999987,
        "reward_max": 0.6493750000000005,
        "reward_min": -1.7253125,
        "leartime_s": 0.05574658900150098,
        "sampletime": 2.144222023023758,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 824000,
        "reward_mean": -0.6517999999999998,
        "reward_max": 0.22187500000000027,
        "reward_min": -1.5333750000000006,
        "leartime_s": 0.07689780698274262,
        "sampletime": 2.299898917990504,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 826000,
        "reward_mean": -0.4806999999999998,
        "reward_max": 0.4568125000000005,
        "reward_min": -1.7495,
        "leartime_s": 0.05509267398156226,
        "sampletime": 1.7685057780181523,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 828000,
        "reward_mean": -0.3359249999999998,
        "reward_max": 0.4480000000000007,
        "reward_min": -1.2139375000000001,
        "leartime_s": 0.045436698012053967,
        "sampletime": 2.237769480998395,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 830000,
        "reward_mean": -0.6010499999999999,
        "reward_max": 0.5114375000000004,
        "reward_min": -1.9479999999999997,
        "leartime_s": 0.04433850999339484,
        "sampletime": 1.765226909017656,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 832000,
        "reward_mean": -0.4890249999999999,
        "reward_max": 0.6101250000000003,
        "reward_min": -1.4810624999999995,
        "leartime_s": 0.05212505999952555,
        "sampletime": 1.6330003479961306,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 834000,
        "reward_mean": -0.2761749999999997,
        "reward_max": 0.9008125000000006,
        "reward_min": -1.4054375,
        "leartime_s": 0.10860181698808447,
        "sampletime": 2.109739581006579,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 836000,
        "reward_mean": -0.49444999999999983,
        "reward_max": 0.34350000000000064,
        "reward_min": -1.5301875,
        "leartime_s": 0.032852845994057134,
        "sampletime": 2.0021841940179,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 838000,
        "reward_mean": -0.34684999999999977,
        "reward_max": 0.5355000000000005,
        "reward_min": -2.07175,
        "leartime_s": 0.04335004897438921,
        "sampletime": 1.780409945989959,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 840000,
        "reward_mean": -0.4197499999999998,
        "reward_max": 0.7176875000000005,
        "reward_min": -2.0279999999999996,
        "leartime_s": 0.037655727006495,
        "sampletime": 2.1330982799991034,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 842000,
        "reward_mean": -0.46562499999999973,
        "reward_max": 0.5121875000000007,
        "reward_min": -1.909625,
        "leartime_s": 0.030753200000617653,
        "sampletime": 1.6234605569916312,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 844000,
        "reward_mean": -0.2606249999999998,
        "reward_max": 0.7037500000000005,
        "reward_min": -1.3888749999999994,
        "leartime_s": 0.038782246003393084,
        "sampletime": 2.2828555630112533,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 846000,
        "reward_mean": -0.42772499999999986,
        "reward_max": 0.6538125000000006,
        "reward_min": -1.6175000000000006,
        "leartime_s": 0.026418800000101328,
        "sampletime": 1.7391349230019841,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 848000,
        "reward_mean": -0.2528499999999998,
        "reward_max": 0.5524375000000004,
        "reward_min": -1.2425625,
        "leartime_s": 0.06706857599783689,
        "sampletime": 1.7062414060055744,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 850000,
        "reward_mean": -0.5280249999999997,
        "reward_max": 0.6083125000000004,
        "reward_min": -1.7376250000000002,
        "leartime_s": 0.039386188989738,
        "sampletime": 2.078075010009343,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 852000,
        "reward_mean": -0.3049749999999997,
        "reward_max": 0.6818125000000002,
        "reward_min": -1.5290625,
        "leartime_s": 0.06075435702223331,
        "sampletime": 1.7557221809984185,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 854000,
        "reward_mean": -0.6490499999999997,
        "reward_max": 0.2965625000000004,
        "reward_min": -1.6909375,
        "leartime_s": 0.06800133400247432,
        "sampletime": 1.4990868419990875,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 856000,
        "reward_mean": -0.6240749999999998,
        "reward_max": 0.3006875000000004,
        "reward_min": -2.393,
        "leartime_s": 0.04894386499654502,
        "sampletime": 1.8555029229901265,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 858000,
        "reward_mean": -0.2620999999999998,
        "reward_max": 0.5725625000000003,
        "reward_min": -1.4493750000000003,
        "leartime_s": 0.026246827997965738,
        "sampletime": 1.7656999249884393,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 860000,
        "reward_mean": -0.6352499999999998,
        "reward_max": 0.4061250000000006,
        "reward_min": -1.8196875000000001,
        "leartime_s": 0.05017062497790903,
        "sampletime": 1.868440243997611,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 862000,
        "reward_mean": -0.4586249999999997,
        "reward_max": 0.6824375000000003,
        "reward_min": -2.006,
        "leartime_s": 0.03713856899412349,
        "sampletime": 1.4896066630026326,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 864000,
        "reward_mean": -0.09714999999999974,
        "reward_max": 0.9493125000000004,
        "reward_min": -1.1109374999999995,
        "leartime_s": 0.039154008991317824,
        "sampletime": 1.4337788799894042,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 866000,
        "reward_mean": -0.7508499999999999,
        "reward_max": 0.20987500000000048,
        "reward_min": -2.3875624999999996,
        "leartime_s": 0.03450870199594647,
        "sampletime": 1.7720737110066693,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 868000,
        "reward_mean": -0.2740999999999998,
        "reward_max": 0.5952500000000005,
        "reward_min": -1.647375,
        "leartime_s": 0.026437485998030752,
        "sampletime": 1.8940880830050446,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 870000,
        "reward_mean": -0.12309999999999974,
        "reward_max": 0.8278125000000002,
        "reward_min": -1.4867499999999996,
        "leartime_s": 0.03786131797824055,
        "sampletime": 1.7601013039820828,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 872000,
        "reward_mean": -0.4597749999999998,
        "reward_max": 0.6034375000000003,
        "reward_min": -1.5039374999999997,
        "leartime_s": 0.06887586298398674,
        "sampletime": 1.5926288870105054,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 874000,
        "reward_mean": -0.34787499999999977,
        "reward_max": 0.8380625000000006,
        "reward_min": -2.4546875000000004,
        "leartime_s": 0.07986968601471744,
        "sampletime": 1.7238135799998417,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 876000,
        "reward_mean": -0.22527499999999978,
        "reward_max": 0.8357500000000003,
        "reward_min": -1.4884999999999997,
        "leartime_s": 0.06525604199850932,
        "sampletime": 1.8602300710044801,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 878000,
        "reward_mean": -0.28487499999999977,
        "reward_max": 0.9053125000000004,
        "reward_min": -1.42,
        "leartime_s": 0.05706528900191188,
        "sampletime": 1.4341685080144089,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 880000,
        "reward_mean": -0.3591999999999997,
        "reward_max": 0.6239375000000005,
        "reward_min": -1.350625,
        "leartime_s": 0.024843853985657915,
        "sampletime": 1.6813547599886078,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 882000,
        "reward_mean": -0.13507499999999967,
        "reward_max": 0.8135000000000007,
        "reward_min": -1.4361249999999999,
        "leartime_s": 0.04961651100893505,
        "sampletime": 1.8429931819846388,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 884000,
        "reward_mean": -0.2378749999999997,
        "reward_max": 0.5820625000000004,
        "reward_min": -1.5905625000000005,
        "leartime_s": 0.04420544800814241,
        "sampletime": 1.7959249669802375,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 886000,
        "reward_mean": -0.23232499999999973,
        "reward_max": 0.9730000000000008,
        "reward_min": -1.6556249999999997,
        "leartime_s": 0.044857714005047455,
        "sampletime": 1.553314329998102,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 888000,
        "reward_mean": -0.027699999999999735,
        "reward_max": 1.0530000000000004,
        "reward_min": -1.540375,
        "leartime_s": 0.02979543700348586,
        "sampletime": 1.7655024450214114,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 890000,
        "reward_mean": -0.14354999999999973,
        "reward_max": 0.8265000000000005,
        "reward_min": -1.4447500000000002,
        "leartime_s": 0.024183163011912256,
        "sampletime": 1.8094362120027654,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 892000,
        "reward_mean": -0.1972749999999997,
        "reward_max": 0.8084375000000007,
        "reward_min": -1.233375,
        "leartime_s": 0.06842107701231726,
        "sampletime": 1.5262408950075042,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 894000,
        "reward_mean": -0.25474999999999975,
        "reward_max": 0.7361875000000004,
        "reward_min": -1.4400625000000002,
        "leartime_s": 0.05246349301887676,
        "sampletime": 1.6628844779916108,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 896000,
        "reward_mean": -0.3411539499999997,
        "reward_max": 0.5975000000000007,
        "reward_min": -1.8290666666666666,
        "leartime_s": 0.044361049978761,
        "sampletime": 1.56872219601064,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 898000,
        "reward_mean": -0.47287499999999977,
        "reward_max": 0.44600000000000034,
        "reward_min": -1.5635624999999997,
        "leartime_s": 0.0560435900115408,
        "sampletime": 1.807104084000457,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 900000,
        "reward_mean": -0.4284499999999998,
        "reward_max": 0.5039375000000006,
        "reward_min": -1.5958750000000004,
        "leartime_s": 0.026816799014341086,
        "sampletime": 1.7452371930121444,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 902000,
        "reward_mean": -0.07914999999999967,
        "reward_max": 1.1004375000000006,
        "reward_min": -1.2303124999999997,
        "leartime_s": 0.021732900000642985,
        "sampletime": 1.8581177500018384,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 904000,
        "reward_mean": -0.3027499999999998,
        "reward_max": 0.6116250000000004,
        "reward_min": -1.3269375000000003,
        "leartime_s": 0.026697237975895405,
        "sampletime": 1.5586558979994152,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 906000,
        "reward_mean": -0.10949999999999975,
        "reward_max": 0.8458750000000005,
        "reward_min": -1.1206874999999996,
        "leartime_s": 0.06161778399837203,
        "sampletime": 1.7498183250136208,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 908000,
        "reward_mean": -0.22412499999999977,
        "reward_max": 0.8416250000000006,
        "reward_min": -1.6805,
        "leartime_s": 0.04817169898888096,
        "sampletime": 2.11919232699438,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 910000,
        "reward_mean": -0.46244999999999975,
        "reward_max": 0.5336250000000006,
        "reward_min": -1.7179374999999997,
        "leartime_s": 0.048239526979159564,
        "sampletime": 1.4076918869977817,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 912000,
        "reward_mean": -0.29557499999999975,
        "reward_max": 0.9364375000000004,
        "reward_min": -1.7083125000000001,
        "leartime_s": 0.028513113007647917,
        "sampletime": 1.7224924009933602,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 914000,
        "reward_mean": -0.30272499999999974,
        "reward_max": 0.7376250000000003,
        "reward_min": -1.637,
        "leartime_s": 0.05483052699128166,
        "sampletime": 1.7858117969881278,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 916000,
        "reward_mean": -0.3654249999999997,
        "reward_max": 0.6918125000000006,
        "reward_min": -1.7731875,
        "leartime_s": 0.03047923999838531,
        "sampletime": 1.6648149539832957,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 918000,
        "reward_mean": -0.15784999999999974,
        "reward_max": 1.0770000000000006,
        "reward_min": -1.5939375000000002,
        "leartime_s": 0.04439911700319499,
        "sampletime": 1.5298548129794654,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 920000,
        "reward_mean": -0.19377499999999975,
        "reward_max": 0.7445625000000005,
        "reward_min": -1.3410625,
        "leartime_s": 0.08197756300796755,
        "sampletime": 1.8569016420224216,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 922000,
        "reward_mean": -0.37574999999999975,
        "reward_max": 0.41200000000000025,
        "reward_min": -2.5199374999999997,
        "leartime_s": 0.03578554900013842,
        "sampletime": 1.5152582759910729,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 924000,
        "reward_mean": -0.2975749999999997,
        "reward_max": 0.9164375000000005,
        "reward_min": -1.5130625000000002,
        "leartime_s": 0.04201233200728893,
        "sampletime": 1.6955546999815851,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 926000,
        "reward_mean": -0.14617499999999972,
        "reward_max": 1.0201250000000006,
        "reward_min": -1.617875,
        "leartime_s": 0.024442674010060728,
        "sampletime": 1.506036229984602,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 928000,
        "reward_mean": -0.12772499999999967,
        "reward_max": 0.8805000000000005,
        "reward_min": -1.2100000000000002,
        "leartime_s": 0.09442524399491958,
        "sampletime": 1.8290933570242487,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 930000,
        "reward_mean": -0.28939999999999977,
        "reward_max": 0.6310625000000003,
        "reward_min": -1.4146250000000005,
        "leartime_s": 0.058019046002300456,
        "sampletime": 1.9820479769841768,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 932000,
        "reward_mean": -0.23012499999999977,
        "reward_max": 0.5260000000000006,
        "reward_min": -1.5581874999999998,
        "leartime_s": 0.024754782993113622,
        "sampletime": 1.7021217999863438,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 934000,
        "reward_mean": -0.37699999999999984,
        "reward_max": 0.7941250000000002,
        "reward_min": -1.7703125000000004,
        "leartime_s": 0.08398670802125707,
        "sampletime": 1.858563696994679,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 936000,
        "reward_mean": -0.39409999999999973,
        "reward_max": 0.6601250000000005,
        "reward_min": -1.8877500000000003,
        "leartime_s": 0.036378302989760414,
        "sampletime": 1.837724214012269,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 938000,
        "reward_mean": 0.09550000000000028,
        "reward_max": 1.0123750000000005,
        "reward_min": -1.3238750000000004,
        "leartime_s": 0.034638709999853745,
        "sampletime": 1.7529231460066512,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 940000,
        "reward_mean": -0.01549999999999967,
        "reward_max": 0.7608125000000003,
        "reward_min": -1.7829374999999996,
        "leartime_s": 0.0297033810056746,
        "sampletime": 1.5579343639838044,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 942000,
        "reward_mean": 0.03937500000000031,
        "reward_max": 0.9161250000000003,
        "reward_min": -1.7598749999999996,
        "leartime_s": 0.030858223006362095,
        "sampletime": 1.7149110029859003,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 944000,
        "reward_mean": -0.11652499999999968,
        "reward_max": 1.1250625000000007,
        "reward_min": -1.1537500000000003,
        "leartime_s": 0.03895333799300715,
        "sampletime": 1.7916415270010475,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 946000,
        "reward_mean": -0.09424999999999965,
        "reward_max": 0.9179375000000005,
        "reward_min": -1.0995625,
        "leartime_s": 0.04741844898671843,
        "sampletime": 1.9544303829898126,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 948000,
        "reward_mean": 0.29225000000000023,
        "reward_max": 1.2553750000000001,
        "reward_min": -1.158625,
        "leartime_s": 0.026027322019217536,
        "sampletime": 1.560310543020023,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 950000,
        "reward_mean": 0.2805250000000003,
        "reward_max": 1.2858750000000003,
        "reward_min": -1.0895625,
        "leartime_s": 0.05397522999555804,
        "sampletime": 1.8277866990247276,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 952000,
        "reward_mean": -0.07152499999999974,
        "reward_max": 0.8595625000000007,
        "reward_min": -1.764625,
        "leartime_s": 0.034983821999048814,
        "sampletime": 1.6000267600174993,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 954000,
        "reward_mean": -0.15579999999999972,
        "reward_max": 0.6966250000000003,
        "reward_min": -1.5217500000000002,
        "leartime_s": 0.022722578985849395,
        "sampletime": 1.6497464989952277,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 956000,
        "reward_mean": -0.08894999999999971,
        "reward_max": 0.8449375000000005,
        "reward_min": -1.299875,
        "leartime_s": 0.06775223001022823,
        "sampletime": 1.6193235899845604,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 958000,
        "reward_mean": -0.2679749999999998,
        "reward_max": 0.6441875000000006,
        "reward_min": -1.5036875,
        "leartime_s": 0.04285635400447063,
        "sampletime": 1.8291580739896744,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 960000,
        "reward_mean": -0.025749999999999704,
        "reward_max": 0.8577500000000003,
        "reward_min": -1.1428125,
        "leartime_s": 0.03355730097973719,
        "sampletime": 1.7629254450148437,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 962000,
        "reward_mean": 0.046950000000000304,
        "reward_max": 0.9911250000000007,
        "reward_min": -1.4790625,
        "leartime_s": 0.023341091990005225,
        "sampletime": 1.752534202998504,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 964000,
        "reward_mean": -0.015874999999999716,
        "reward_max": 1.1136875000000002,
        "reward_min": -2.2990625000000007,
        "leartime_s": 0.061258386995177716,
        "sampletime": 1.7149124270072207,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 966000,
        "reward_mean": -0.08424999999999963,
        "reward_max": 0.9067500000000003,
        "reward_min": -1.7188124999999999,
        "leartime_s": 0.069423455017386,
        "sampletime": 1.5709781520126853,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 968000,
        "reward_mean": 0.00525000000000028,
        "reward_max": 1.0427500000000007,
        "reward_min": -1.0225624999999998,
        "leartime_s": 0.04910041700350121,
        "sampletime": 1.7229468849836849,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 970000,
        "reward_mean": -0.24779999999999977,
        "reward_max": 0.8343750000000005,
        "reward_min": -1.4590000000000003,
        "leartime_s": 0.06413481300114654,
        "sampletime": 1.7261958699964453,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 972000,
        "reward_mean": -0.09067499999999964,
        "reward_max": 1.0824375000000006,
        "reward_min": -1.2879375,
        "leartime_s": 0.07736679702065885,
        "sampletime": 1.6215340399940033,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 974000,
        "reward_mean": -0.053424999999999695,
        "reward_max": 0.9041250000000005,
        "reward_min": -1.6183125000000003,
        "leartime_s": 0.07058452401543036,
        "sampletime": 1.7491312690253835,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 976000,
        "reward_mean": -0.20409999999999975,
        "reward_max": 0.8795000000000006,
        "reward_min": -1.265875,
        "leartime_s": 0.025550759019097313,
        "sampletime": 1.7266474429925438,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 978000,
        "reward_mean": -0.0992499999999998,
        "reward_max": 0.8878750000000003,
        "reward_min": -1.2193125000000005,
        "leartime_s": 0.059686774999136105,
        "sampletime": 1.7990034309914336,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 980000,
        "reward_mean": -0.11184999999999977,
        "reward_max": 0.8123125000000002,
        "reward_min": -1.9849374999999994,
        "leartime_s": 0.09931278700241819,
        "sampletime": 1.6117836410121527,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 982000,
        "reward_mean": 0.04315000000000034,
        "reward_max": 1.1576875000000004,
        "reward_min": -1.1899375,
        "leartime_s": 0.032226480019744486,
        "sampletime": 1.4975189229880925,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 984000,
        "reward_mean": -0.19552499999999978,
        "reward_max": 0.8271250000000006,
        "reward_min": -1.3318125,
        "leartime_s": 0.03598909400170669,
        "sampletime": 1.62818325398257,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 986000,
        "reward_mean": 0.041325000000000243,
        "reward_max": 1.3622500000000008,
        "reward_min": -1.0886875,
        "leartime_s": 0.03285546999541111,
        "sampletime": 1.7462657720025163,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 988000,
        "reward_mean": 0.0228000000000003,
        "reward_max": 1.1770000000000005,
        "reward_min": -1.4614375,
        "leartime_s": 0.04462079700897448,
        "sampletime": 1.4057471730047837,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 990000,
        "reward_mean": -0.34699999999999975,
        "reward_max": 0.6738750000000003,
        "reward_min": -1.3656875000000002,
        "leartime_s": 0.05267333300434984,
        "sampletime": 2.000940375000937,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 992000,
        "reward_mean": -0.09734999999999974,
        "reward_max": 0.9065625000000006,
        "reward_min": -1.1860625,
        "leartime_s": 0.07655081999837421,
        "sampletime": 1.7354021829960402,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 994000,
        "reward_mean": 0.01822500000000029,
        "reward_max": 0.9425000000000006,
        "reward_min": -1.253125,
        "leartime_s": 0.02448235999327153,
        "sampletime": 1.5500704419973772,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 996000,
        "reward_mean": 0.035025000000000264,
        "reward_max": 0.8897500000000004,
        "reward_min": -1.2113750000000003,
        "leartime_s": 0.05389465400367044,
        "sampletime": 1.8487054590077605,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 998000,
        "reward_mean": -0.3835499999999997,
        "reward_max": 0.5635000000000006,
        "reward_min": -1.8089375,
        "leartime_s": 0.05335100498632528,
        "sampletime": 1.9332141810155008,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 1000000,
        "reward_mean": 0.1740750000000003,
        "reward_max": 1.3325000000000005,
        "reward_min": -0.9259374999999996,
        "leartime_s": 0.07755192799959332,
        "sampletime": 1.7330280800233595,
        "best_mean": 0.3689250000000003,
        "best_max": 1.2173750000000008,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]