[
    {
        "generation": 1,
        "timesteps": 20000,
        "reward_mean": -39.38632869047619,
        "reward_max": -9.581999999999999,
        "reward_min": -84.21937500000001,
        "leartime_s": 0.01685702399117872,
        "sampletime": 7.595801660994766,
        "best_mean": -39.38632869047619,
        "best_max": -9.581999999999999,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 40000,
        "reward_mean": -31.242251666666668,
        "reward_max": -0.40437499999999965,
        "reward_min": -129.80812500000002,
        "leartime_s": 0.010049401986179873,
        "sampletime": 7.9055966320156585,
        "best_mean": -31.242251666666668,
        "best_max": -0.40437499999999965,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 60000,
        "reward_mean": -18.653125000000003,
        "reward_max": 0.15250000000000113,
        "reward_min": -65.20375000000001,
        "leartime_s": 0.004547051998088136,
        "sampletime": 7.706650350999553,
        "best_mean": -18.653125000000003,
        "best_max": 0.15250000000000113,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 80000,
        "reward_mean": -18.094350000000006,
        "reward_max": 1.674375000000001,
        "reward_min": -38.66000000000002,
        "leartime_s": 0.012883537012385204,
        "sampletime": 7.675200908997795,
        "best_mean": -18.094350000000006,
        "best_max": 1.674375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 100000,
        "reward_mean": -18.124350000000003,
        "reward_max": 1.9443750000000013,
        "reward_min": -40.42812499999999,
        "leartime_s": 0.005408349010394886,
        "sampletime": 7.870936918014195,
        "best_mean": -18.094350000000006,
        "best_max": 1.674375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 120000,
        "reward_mean": -13.70835,
        "reward_max": 0.2575000000000006,
        "reward_min": -98.48062499999997,
        "leartime_s": 0.004268127988325432,
        "sampletime": 7.797528552997392,
        "best_mean": -13.70835,
        "best_max": 0.2575000000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 140000,
        "reward_mean": -2.156,
        "reward_max": 0.5600000000000003,
        "reward_min": -18.4325,
        "leartime_s": 0.004355589975602925,
        "sampletime": 7.79552525098552,
        "best_mean": -2.156,
        "best_max": 0.5600000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 160000,
        "reward_mean": -1.2943249999999997,
        "reward_max": 1.453125000000001,
        "reward_min": -22.063125,
        "leartime_s": 0.004466340993531048,
        "sampletime": 7.719624391000252,
        "best_mean": -1.2943249999999997,
        "best_max": 1.453125000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 180000,
        "reward_mean": -0.8511499999999999,
        "reward_max": 0.5350000000000007,
        "reward_min": -3.236250000000002,
        "leartime_s": 0.0054842300014570355,
        "sampletime": 7.774987423006678,
        "best_mean": -0.8511499999999999,
        "best_max": 0.5350000000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 200000,
        "reward_mean": -0.8344000000000001,
        "reward_max": 0.05875,
        "reward_min": -2.4437500000000005,
        "leartime_s": 0.012887432996649295,
        "sampletime": 7.7730557860049885,
        "best_mean": -0.8344000000000001,
        "best_max": 0.05875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 220000,
        "reward_mean": -0.64975,
        "reward_max": 0.1593750000000002,
        "reward_min": -1.6812500000000008,
        "leartime_s": 0.00931892401422374,
        "sampletime": 7.896713170019211,
        "best_mean": -0.64975,
        "best_max": 0.1593750000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 240000,
        "reward_mean": -0.9017185000000002,
        "reward_max": -0.009375000000000008,
        "reward_min": -2.2881249999999995,
        "leartime_s": 0.004544541006907821,
        "sampletime": 7.62782768800389,
        "best_mean": -0.64975,
        "best_max": 0.1593750000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 260000,
        "reward_mean": -0.75235,
        "reward_max": 0.13000000000000003,
        "reward_min": -1.781875,
        "leartime_s": 0.014771534013561904,
        "sampletime": 7.736887267994462,
        "best_mean": -0.64975,
        "best_max": 0.1593750000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 280000,
        "reward_mean": -0.6294749999999999,
        "reward_max": 0.32062500000000016,
        "reward_min": -1.9718749999999985,
        "leartime_s": 0.004766502999700606,
        "sampletime": 7.703200801013736,
        "best_mean": -0.6294749999999999,
        "best_max": 0.32062500000000016,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 300000,
        "reward_mean": -0.41945299999999974,
        "reward_max": 0.5718750000000007,
        "reward_min": -1.7712499999999998,
        "leartime_s": 0.00463033199775964,
        "sampletime": 7.8480703470122535,
        "best_mean": -0.41945299999999974,
        "best_max": 0.5718750000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 320000,
        "reward_mean": -0.5416749999999995,
        "reward_max": 0.5662500000000006,
        "reward_min": -2.1506249999999993,
        "leartime_s": 0.004798173002200201,
        "sampletime": 8.877089693996822,
        "best_mean": -0.41945299999999974,
        "best_max": 0.5718750000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 340000,
        "reward_mean": -0.6257249999999998,
        "reward_max": 0.6675000000000006,
        "reward_min": -2.313125,
        "leartime_s": 0.004884052992565557,
        "sampletime": 8.745338835986331,
        "best_mean": -0.41945299999999974,
        "best_max": 0.5718750000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 360000,
        "reward_mean": -0.8074499999999998,
        "reward_max": 0.5887500000000007,
        "reward_min": -2.3212499999999996,
        "leartime_s": 0.006471867993241176,
        "sampletime": 8.42927413401776,
        "best_mean": -0.41945299999999974,
        "best_max": 0.5718750000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 380000,
        "reward_mean": 0.06075000000000044,
        "reward_max": 1.2375000000000005,
        "reward_min": -1.85625,
        "leartime_s": 0.004876683990005404,
        "sampletime": 8.55876067499048,
        "best_mean": 0.06075000000000044,
        "best_max": 1.2375000000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 400000,
        "reward_mean": 0.07235000000000034,
        "reward_max": 1.1812500000000004,
        "reward_min": -1.2743749999999998,
        "leartime_s": 0.004960033984389156,
        "sampletime": 8.518298844981473,
        "best_mean": 0.07235000000000034,
        "best_max": 1.1812500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 420000,
        "reward_mean": -0.07369999999999961,
        "reward_max": 0.9893750000000003,
        "reward_min": -1.41625,
        "leartime_s": 0.010832594998646528,
        "sampletime": 8.618056723993504,
        "best_mean": 0.07235000000000034,
        "best_max": 1.1812500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 440000,
        "reward_mean": 0.2604250000000004,
        "reward_max": 1.2968750000000004,
        "reward_min": -0.8562499999999993,
        "leartime_s": 0.005013144022086635,
        "sampletime": 8.453950207011076,
        "best_mean": 0.2604250000000004,
        "best_max": 1.2968750000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 460000,
        "reward_mean": 0.1942000000000004,
        "reward_max": 1.1943750000000002,
        "reward_min": -0.7531249999999994,
        "leartime_s": 0.005293738009640947,
        "sampletime": 8.476746147993254,
        "best_mean": 0.2604250000000004,
        "best_max": 1.2968750000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 480000,
        "reward_mean": 0.16132500000000038,
        "reward_max": 1.1687500000000006,
        "reward_min": -0.5768750000000004,
        "leartime_s": 0.007291112997336313,
        "sampletime": 10.31004644499626,
        "best_mean": 0.2604250000000004,
        "best_max": 1.2968750000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 500000,
        "reward_mean": 0.3743000000000006,
        "reward_max": 1.1912500000000006,
        "reward_min": -0.5687499999999983,
        "leartime_s": 0.006739267992088571,
        "sampletime": 10.51193958701333,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 520000,
        "reward_mean": 0.30482500000000046,
        "reward_max": 1.3762500000000006,
        "reward_min": -0.599375,
        "leartime_s": 0.019693301001098007,
        "sampletime": 10.176479256013408,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 540000,
        "reward_mean": 0.3594500000000005,
        "reward_max": 1.2875000000000005,
        "reward_min": -0.6393749999999988,
        "leartime_s": 0.005237655976088718,
        "sampletime": 10.265924257982988,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 560000,
        "reward_mean": -0.008099999999999476,
        "reward_max": 0.7956250000000008,
        "reward_min": -1.1731250000000002,
        "leartime_s": 0.005596108996542171,
        "sampletime": 10.816717509995215,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 580000,
        "reward_mean": 0.029650000000000537,
        "reward_max": 1.159375000000001,
        "reward_min": -1.7874999999999996,
        "leartime_s": 0.005541988008189946,
        "sampletime": 11.260829614999238,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 600000,
        "reward_mean": 0.2632750000000006,
        "reward_max": 1.4775000000000007,
        "reward_min": -1.624375,
        "leartime_s": 0.004029244999401271,
        "sampletime": 11.37179283797741,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 620000,
        "reward_mean": 0.26652500000000046,
        "reward_max": 1.3062500000000006,
        "reward_min": -1.1424999999999996,
        "leartime_s": 0.035319407004863024,
        "sampletime": 11.366784890007693,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 640000,
        "reward_mean": 0.1655500000000005,
        "reward_max": 1.2587500000000005,
        "reward_min": -1.1356249999999983,
        "leartime_s": 0.005762657994637266,
        "sampletime": 11.734253503993386,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 660000,
        "reward_mean": 0.31880000000000064,
        "reward_max": 1.725625000000001,
        "reward_min": -1.6974999999999993,
        "leartime_s": 0.005555838986765593,
        "sampletime": 11.881245319993468,
        "best_mean": 0.3743000000000006,
        "best_max": 1.1912500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 680000,
        "reward_mean": 0.5769500000000005,
        "reward_max": 1.695000000000001,
        "reward_min": -0.733125,
        "leartime_s": 0.005596697999862954,
        "sampletime": 11.832757669995772,
        "best_mean": 0.5769500000000005,
        "best_max": 1.695000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 700000,
        "reward_mean": 0.5311000000000006,
        "reward_max": 1.7118750000000005,
        "reward_min": -1.053124999999999,
        "leartime_s": 0.008205140999052674,
        "sampletime": 12.214954091003165,
        "best_mean": 0.5769500000000005,
        "best_max": 1.695000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 720000,
        "reward_mean": 0.41407500000000064,
        "reward_max": 1.2493750000000008,
        "reward_min": -0.8174999999999999,
        "leartime_s": 0.005735610000556335,
        "sampletime": 11.871173620980699,
        "best_mean": 0.5769500000000005,
        "best_max": 1.695000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 740000,
        "reward_mean": 0.8601000000000006,
        "reward_max": 1.8543750000000008,
        "reward_min": -0.0856249999999994,
        "leartime_s": 0.0561923980130814,
        "sampletime": 11.296040212007938,
        "best_mean": 0.8601000000000006,
        "best_max": 1.8543750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 760000,
        "reward_mean": 0.7339750000000006,
        "reward_max": 1.4400000000000004,
        "reward_min": -0.26249999999999984,
        "leartime_s": 0.00607410300290212,
        "sampletime": 12.325963517010678,
        "best_mean": 0.8601000000000006,
        "best_max": 1.8543750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 780000,
        "reward_mean": 0.6649000000000005,
        "reward_max": 1.677500000000001,
        "reward_min": -0.4206249999999998,
        "leartime_s": 0.006400035985279828,
        "sampletime": 11.497393814992392,
        "best_mean": 0.8601000000000006,
        "best_max": 1.8543750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 800000,
        "reward_mean": 0.8877250000000005,
        "reward_max": 1.9487500000000006,
        "reward_min": -0.3262499999999998,
        "leartime_s": 0.005855208000866696,
        "sampletime": 11.23026569999638,
        "best_mean": 0.8877250000000005,
        "best_max": 1.9487500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 820000,
        "reward_mean": 0.8436750000000005,
        "reward_max": 2.1787500000000004,
        "reward_min": -0.09062499999999934,
        "leartime_s": 0.008118519996060058,
        "sampletime": 11.786527206015307,
        "best_mean": 0.8877250000000005,
        "best_max": 1.9487500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 840000,
        "reward_mean": 1.1106250000000004,
        "reward_max": 2.0631250000000008,
        "reward_min": -0.002499999999999421,
        "leartime_s": 0.007761243992717937,
        "sampletime": 12.165577284991741,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 860000,
        "reward_mean": 0.7857250000000006,
        "reward_max": 1.6262500000000009,
        "reward_min": -0.3787499999999994,
        "leartime_s": 0.025505962024908513,
        "sampletime": 11.214733255008468,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 880000,
        "reward_mean": 0.5217000000000005,
        "reward_max": 1.585625,
        "reward_min": -1.5024999999999995,
        "leartime_s": 0.029876119981054217,
        "sampletime": 11.386897404998308,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 900000,
        "reward_mean": 0.9460500000000006,
        "reward_max": 2.1550000000000007,
        "reward_min": -0.4406249999999993,
        "leartime_s": 0.006389834015863016,
        "sampletime": 11.158930328994757,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 920000,
        "reward_mean": 0.7823000000000006,
        "reward_max": 2.141875,
        "reward_min": -1.6824999999999997,
        "leartime_s": 0.0407779699889943,
        "sampletime": 11.500573238998186,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 940000,
        "reward_mean": 0.9076750000000007,
        "reward_max": 1.8456250000000007,
        "reward_min": -0.5337500000000001,
        "leartime_s": 0.02869612697395496,
        "sampletime": 11.894952731003286,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 960000,
        "reward_mean": 0.9933750000000007,
        "reward_max": 2.09375,
        "reward_min": -0.27062499999999934,
        "leartime_s": 0.007342490978771821,
        "sampletime": 11.406506580999121,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 980000,
        "reward_mean": 0.5063000000000006,
        "reward_max": 1.6868750000000006,
        "reward_min": -1.236249999999999,
        "leartime_s": 0.025706746004289016,
        "sampletime": 12.154882817005273,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 1000000,
        "reward_mean": 1.1025750000000007,
        "reward_max": 2.2825,
        "reward_min": -1.2737499999999997,
        "leartime_s": 0.0072048289875965565,
        "sampletime": 11.946506852982566,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 1020000,
        "reward_mean": 0.9325250000000005,
        "reward_max": 1.9625000000000004,
        "reward_min": -0.40687499999999943,
        "leartime_s": 0.025872553000226617,
        "sampletime": 11.692320126021514,
        "best_mean": 1.1106250000000004,
        "best_max": 2.0631250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 1040000,
        "reward_mean": 1.1237000000000008,
        "reward_max": 2.2493750000000006,
        "reward_min": -0.49437499999999934,
        "leartime_s": 0.008632234996184707,
        "sampletime": 11.902381372987293,
        "best_mean": 1.1237000000000008,
        "best_max": 2.2493750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 1060000,
        "reward_mean": 0.7685500000000006,
        "reward_max": 1.6787500000000006,
        "reward_min": -1.0437500000000002,
        "leartime_s": 0.010296563996234909,
        "sampletime": 12.045241749001434,
        "best_mean": 1.1237000000000008,
        "best_max": 2.2493750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 1080000,
        "reward_mean": 0.9735500000000006,
        "reward_max": 2.0718750000000004,
        "reward_min": -0.3931249999999995,
        "leartime_s": 0.006275110994465649,
        "sampletime": 11.161956869007554,
        "best_mean": 1.1237000000000008,
        "best_max": 2.2493750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 1100000,
        "reward_mean": 1.3088000000000006,
        "reward_max": 2.545000000000001,
        "reward_min": -0.21812499999999885,
        "leartime_s": 0.0543033369758632,
        "sampletime": 12.651897453994025,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 1120000,
        "reward_mean": 0.5159000000000007,
        "reward_max": 1.6687500000000006,
        "reward_min": -1.1162499999999993,
        "leartime_s": 0.031214402028126642,
        "sampletime": 11.76949925898225,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 1140000,
        "reward_mean": 0.9187500000000004,
        "reward_max": 2.0175000000000005,
        "reward_min": -0.3199999999999997,
        "leartime_s": 0.04328014201018959,
        "sampletime": 11.395233223011019,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 1160000,
        "reward_mean": 0.6859250000000007,
        "reward_max": 1.9037500000000005,
        "reward_min": -1.5762499999999995,
        "leartime_s": 0.007592822017613798,
        "sampletime": 12.398539499001345,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 1180000,
        "reward_mean": 1.0049750000000006,
        "reward_max": 1.9637500000000006,
        "reward_min": -0.7243749999999994,
        "leartime_s": 0.008499830000801012,
        "sampletime": 11.843311201984761,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 1200000,
        "reward_mean": 0.6928250000000005,
        "reward_max": 1.5475000000000003,
        "reward_min": -0.5256249999999997,
        "leartime_s": 0.021781559014925733,
        "sampletime": 11.248840459011262,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 1220000,
        "reward_mean": 0.6950750000000007,
        "reward_max": 1.8631250000000001,
        "reward_min": -0.6656249999999999,
        "leartime_s": 0.008114647003822029,
        "sampletime": 12.8316261760192,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 1240000,
        "reward_mean": 1.1530500000000006,
        "reward_max": 2.2300000000000004,
        "reward_min": 0.023750000000000118,
        "leartime_s": 0.00685802599764429,
        "sampletime": 11.591775320994202,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 1260000,
        "reward_mean": 0.8425500000000007,
        "reward_max": 2.0193750000000006,
        "reward_min": -0.39499999999999946,
        "leartime_s": 0.04762064400711097,
        "sampletime": 11.945579325984,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 1280000,
        "reward_mean": 1.0345250000000008,
        "reward_max": 1.9500000000000006,
        "reward_min": 0.02375000000000048,
        "leartime_s": 0.0061060199805069715,
        "sampletime": 11.79121692100307,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 1300000,
        "reward_mean": 0.9240750000000008,
        "reward_max": 1.8418750000000004,
        "reward_min": -0.23937499999999928,
        "leartime_s": 0.018473342002835125,
        "sampletime": 11.930018971004756,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 1320000,
        "reward_mean": 0.8206250000000007,
        "reward_max": 1.8737500000000007,
        "reward_min": -0.7343749999999998,
        "leartime_s": 0.01075230399146676,
        "sampletime": 11.729349862987874,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 1340000,
        "reward_mean": 0.8125250000000006,
        "reward_max": 1.8475000000000008,
        "reward_min": -0.10249999999999976,
        "leartime_s": 0.04804737999802455,
        "sampletime": 12.465004751022207,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 1360000,
        "reward_mean": 0.9674750000000008,
        "reward_max": 2.0631250000000008,
        "reward_min": -1.0418749999999992,
        "leartime_s": 0.033721082989359275,
        "sampletime": 11.746215715975268,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 1380000,
        "reward_mean": 0.8705250000000005,
        "reward_max": 1.7243750000000007,
        "reward_min": -0.26187499999999914,
        "leartime_s": 0.02171288398676552,
        "sampletime": 11.676746160985203,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 1400000,
        "reward_mean": 0.9254500000000008,
        "reward_max": 1.8143750000000005,
        "reward_min": -0.17562499999999948,
        "leartime_s": 0.015276724006980658,
        "sampletime": 12.010988824011292,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 1420000,
        "reward_mean": 0.9212500000000007,
        "reward_max": 2.030625000000001,
        "reward_min": -0.4449999999999993,
        "leartime_s": 0.018723482004133984,
        "sampletime": 11.661076213989872,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 1440000,
        "reward_mean": 0.8704000000000007,
        "reward_max": 2.119375000000001,
        "reward_min": -0.47124999999999895,
        "leartime_s": 0.007019985991064459,
        "sampletime": 11.775130057998467,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 1460000,
        "reward_mean": 1.2250250000000005,
        "reward_max": 2.1837500000000007,
        "reward_min": -0.040624999999999634,
        "leartime_s": 0.007427397998981178,
        "sampletime": 12.270495998003753,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 1480000,
        "reward_mean": 0.7807750000000006,
        "reward_max": 1.738125000000001,
        "reward_min": -0.27562500000000006,
        "leartime_s": 0.007665762008400634,
        "sampletime": 11.742725446005352,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 1500000,
        "reward_mean": 0.49952500000000055,
        "reward_max": 1.5387500000000007,
        "reward_min": -2.248125,
        "leartime_s": 0.010369002004154027,
        "sampletime": 12.216349289985374,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 1520000,
        "reward_mean": 0.8227000000000007,
        "reward_max": 1.6037500000000007,
        "reward_min": -0.11999999999999895,
        "leartime_s": 0.010727087006671354,
        "sampletime": 11.740123379015131,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 1540000,
        "reward_mean": 0.8549750000000006,
        "reward_max": 1.8975000000000006,
        "reward_min": -0.30374999999999963,
        "leartime_s": 0.023731768975267187,
        "sampletime": 11.360656567994738,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 1560000,
        "reward_mean": 1.084875000000001,
        "reward_max": 2.0375,
        "reward_min": 0.3637500000000004,
        "leartime_s": 0.007503480999730527,
        "sampletime": 11.800688446994172,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 1580000,
        "reward_mean": 0.9050250000000006,
        "reward_max": 2.158125,
        "reward_min": -0.09374999999999944,
        "leartime_s": 0.011514990997966379,
        "sampletime": 11.886214945989195,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 1600000,
        "reward_mean": 0.7717500000000007,
        "reward_max": 1.6637500000000005,
        "reward_min": 0.061250000000000346,
        "leartime_s": 0.021472260996233672,
        "sampletime": 11.958031938993372,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 1620000,
        "reward_mean": 0.9765750000000006,
        "reward_max": 1.9918750000000003,
        "reward_min": 0.2681250000000006,
        "leartime_s": 0.022325327998260036,
        "sampletime": 11.80847982200794,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 1640000,
        "reward_mean": 1.1167500000000006,
        "reward_max": 1.9900000000000009,
        "reward_min": -0.03562499999999996,
        "leartime_s": 0.027581431990256533,
        "sampletime": 11.696341489994666,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 1660000,
        "reward_mean": 1.1116250000000005,
        "reward_max": 1.8175000000000003,
        "reward_min": 0.23750000000000054,
        "leartime_s": 0.016953734011622146,
        "sampletime": 12.093035026016878,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 1680000,
        "reward_mean": 1.0765250000000008,
        "reward_max": 1.861250000000001,
        "reward_min": -0.10249999999999987,
        "leartime_s": 0.01080007801647298,
        "sampletime": 12.072598331986228,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 1700000,
        "reward_mean": 1.0382500000000008,
        "reward_max": 1.7162500000000007,
        "reward_min": -0.0024999999999995165,
        "leartime_s": 0.009312495996709913,
        "sampletime": 11.777013760001864,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 1720000,
        "reward_mean": 0.5978500000000005,
        "reward_max": 1.510625000000001,
        "reward_min": -0.8649999999999995,
        "leartime_s": 0.02547814100398682,
        "sampletime": 11.730531269015046,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 1740000,
        "reward_mean": 0.7191250000000007,
        "reward_max": 1.510000000000001,
        "reward_min": -0.3224999999999997,
        "leartime_s": 0.02390215898049064,
        "sampletime": 11.722039336978924,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 1760000,
        "reward_mean": 0.7391000000000009,
        "reward_max": 1.4637500000000006,
        "reward_min": -0.396875,
        "leartime_s": 0.010110988980159163,
        "sampletime": 11.96054846799234,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 1780000,
        "reward_mean": 1.0150000000000008,
        "reward_max": 1.994375000000001,
        "reward_min": -0.2056249999999994,
        "leartime_s": 0.022415398998418823,
        "sampletime": 12.078191451990278,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 1800000,
        "reward_mean": 1.3084750000000005,
        "reward_max": 2.1725000000000008,
        "reward_min": 0.5000000000000004,
        "leartime_s": 0.05074789302307181,
        "sampletime": 11.836111620010342,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 1820000,
        "reward_mean": 0.7406500000000007,
        "reward_max": 1.6175000000000008,
        "reward_min": -0.19499999999999945,
        "leartime_s": 0.011073185974964872,
        "sampletime": 11.980142006999813,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 1840000,
        "reward_mean": 0.9096250000000006,
        "reward_max": 1.9556250000000004,
        "reward_min": -0.3162499999999996,
        "leartime_s": 0.02914131700526923,
        "sampletime": 11.975707119010622,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 1860000,
        "reward_mean": 0.8908250000000005,
        "reward_max": 1.7481250000000006,
        "reward_min": -0.6793750000000002,
        "leartime_s": 0.033026652003172785,
        "sampletime": 12.260042220004834,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 1880000,
        "reward_mean": 0.8063250000000006,
        "reward_max": 1.6768750000000006,
        "reward_min": -0.4893749999999999,
        "leartime_s": 0.008285826974315569,
        "sampletime": 11.681481078994693,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 1900000,
        "reward_mean": 0.8984000000000005,
        "reward_max": 1.7931250000000005,
        "reward_min": -0.4987499999999997,
        "leartime_s": 0.007454217993654311,
        "sampletime": 11.68598075999762,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 1920000,
        "reward_mean": 1.0358250000000007,
        "reward_max": 2.036250000000001,
        "reward_min": -0.03874999999999894,
        "leartime_s": 0.028716642991639674,
        "sampletime": 11.494721856026445,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 1940000,
        "reward_mean": 0.7846000000000006,
        "reward_max": 1.6768750000000008,
        "reward_min": -0.34312499999999957,
        "leartime_s": 0.0270041809999384,
        "sampletime": 11.495476106996648,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 1960000,
        "reward_mean": 0.8111250000000005,
        "reward_max": 1.7662500000000003,
        "reward_min": -0.7199999999999998,
        "leartime_s": 0.03148211998632178,
        "sampletime": 11.793987580022076,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 1980000,
        "reward_mean": 0.7772500000000007,
        "reward_max": 1.611250000000001,
        "reward_min": -0.10812499999999882,
        "leartime_s": 0.008175374008715153,
        "sampletime": 11.543740324006649,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 2000000,
        "reward_mean": 0.8865750000000007,
        "reward_max": 1.6950000000000007,
        "reward_min": -0.23499999999999951,
        "leartime_s": 0.008302847010781989,
        "sampletime": 11.630946912016952,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 2020000,
        "reward_mean": 0.7133750000000006,
        "reward_max": 1.8425000000000002,
        "reward_min": -0.3056249999999995,
        "leartime_s": 0.020835303992498666,
        "sampletime": 10.525139050994767,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 2040000,
        "reward_mean": 1.1573500000000008,
        "reward_max": 2.018125000000001,
        "reward_min": -0.41937499999999944,
        "leartime_s": 0.02674863301217556,
        "sampletime": 10.134395980014233,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 2060000,
        "reward_mean": 0.7831000000000006,
        "reward_max": 1.5612500000000005,
        "reward_min": -0.2606249999999992,
        "leartime_s": 0.022300793993053958,
        "sampletime": 10.040633735974552,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 2080000,
        "reward_mean": 0.7643500000000006,
        "reward_max": 1.6275000000000004,
        "reward_min": -0.33749999999999947,
        "leartime_s": 0.008299305016407743,
        "sampletime": 10.327821438986575,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 2100000,
        "reward_mean": 0.8247250000000006,
        "reward_max": 1.8781250000000003,
        "reward_min": -0.3937499999999997,
        "leartime_s": 0.015754177002236247,
        "sampletime": 10.230533486988861,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 2120000,
        "reward_mean": 0.8515750000000006,
        "reward_max": 1.8500000000000005,
        "reward_min": -0.7706249999999994,
        "leartime_s": 0.01114225698984228,
        "sampletime": 10.588635650987271,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 2140000,
        "reward_mean": 0.9082500000000006,
        "reward_max": 1.9593750000000008,
        "reward_min": -0.1687499999999994,
        "leartime_s": 0.013048350985627621,
        "sampletime": 10.119628699001623,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 2160000,
        "reward_mean": 0.9006000000000005,
        "reward_max": 1.8812500000000008,
        "reward_min": -0.02437499999999919,
        "leartime_s": 0.015286194015061483,
        "sampletime": 10.698760961007793,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 2180000,
        "reward_mean": 0.8453000000000006,
        "reward_max": 1.8825000000000003,
        "reward_min": -0.30499999999999955,
        "leartime_s": 0.00837962600053288,
        "sampletime": 10.444888796977466,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 2200000,
        "reward_mean": 0.8565000000000007,
        "reward_max": 1.8862500000000004,
        "reward_min": -0.38562499999999944,
        "leartime_s": 0.009110119979595765,
        "sampletime": 10.264109459996689,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 2220000,
        "reward_mean": 0.8207250000000006,
        "reward_max": 1.7631250000000005,
        "reward_min": -0.1918749999999997,
        "leartime_s": 0.010943036002572626,
        "sampletime": 10.161406620987691,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 2240000,
        "reward_mean": 0.8185250000000006,
        "reward_max": 1.6775000000000007,
        "reward_min": -0.17812499999999928,
        "leartime_s": 0.009619974007364362,
        "sampletime": 10.152352789998986,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 2260000,
        "reward_mean": 0.5792250000000005,
        "reward_max": 1.7100000000000006,
        "reward_min": -0.34750000000000014,
        "leartime_s": 0.039857082010712475,
        "sampletime": 10.818407966988161,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 2280000,
        "reward_mean": 0.7076000000000006,
        "reward_max": 1.7862500000000006,
        "reward_min": -0.22374999999999945,
        "leartime_s": 0.023001771012786776,
        "sampletime": 9.750548482988961,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 2300000,
        "reward_mean": 0.9225750000000007,
        "reward_max": 1.805625000000001,
        "reward_min": -0.04312499999999972,
        "leartime_s": 0.017681437981082126,
        "sampletime": 8.981911765993573,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 2320000,
        "reward_mean": 0.7699250000000006,
        "reward_max": 1.6025000000000005,
        "reward_min": -0.03187499999999949,
        "leartime_s": 0.020944443007465452,
        "sampletime": 9.334158138983184,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 2340000,
        "reward_mean": 0.7155750000000006,
        "reward_max": 1.7306250000000003,
        "reward_min": -0.23999999999999908,
        "leartime_s": 0.009494694008026272,
        "sampletime": 8.647162323002703,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 2360000,
        "reward_mean": 0.6132750000000006,
        "reward_max": 1.4443750000000009,
        "reward_min": -0.7218749999999992,
        "leartime_s": 0.010429971996927634,
        "sampletime": 9.49956398701761,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 2380000,
        "reward_mean": 0.7156000000000008,
        "reward_max": 1.431250000000001,
        "reward_min": -0.4068749999999997,
        "leartime_s": 0.016206517000682652,
        "sampletime": 9.879546115000267,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 2400000,
        "reward_mean": 0.8209000000000005,
        "reward_max": 1.8437500000000004,
        "reward_min": -0.07687499999999942,
        "leartime_s": 0.02258595998864621,
        "sampletime": 11.298874493018957,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 2420000,
        "reward_mean": 0.7096500000000006,
        "reward_max": 1.630000000000001,
        "reward_min": -0.19999999999999893,
        "leartime_s": 0.05671976102166809,
        "sampletime": 11.549292224983219,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 2440000,
        "reward_mean": 0.45362500000000067,
        "reward_max": 1.3531250000000008,
        "reward_min": -0.560624999999999,
        "leartime_s": 0.012051529018208385,
        "sampletime": 11.287297236005543,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 2460000,
        "reward_mean": 1.0215250000000007,
        "reward_max": 2.065,
        "reward_min": -0.07249999999999943,
        "leartime_s": 0.0291140710178297,
        "sampletime": 11.976173705013935,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 2480000,
        "reward_mean": 0.7037750000000006,
        "reward_max": 1.9937500000000004,
        "reward_min": -0.55,
        "leartime_s": 0.039945830998476595,
        "sampletime": 11.575670641992474,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 2500000,
        "reward_mean": 0.6860250000000007,
        "reward_max": 1.6175000000000008,
        "reward_min": -0.3031249999999992,
        "leartime_s": 0.009400382987223566,
        "sampletime": 11.20649544900516,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 2520000,
        "reward_mean": 0.6314000000000005,
        "reward_max": 1.9043750000000008,
        "reward_min": -0.40812499999999974,
        "leartime_s": 0.012854739994509146,
        "sampletime": 12.123043960978976,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 2540000,
        "reward_mean": 0.5610000000000005,
        "reward_max": 1.4418750000000005,
        "reward_min": -0.3112499999999993,
        "leartime_s": 0.03142804899835028,
        "sampletime": 12.280331374000525,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 2560000,
        "reward_mean": 0.6240750000000006,
        "reward_max": 1.6912500000000006,
        "reward_min": -0.5574999999999994,
        "leartime_s": 0.012064103997545317,
        "sampletime": 11.499216348020127,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 2580000,
        "reward_mean": 0.4422000000000005,
        "reward_max": 1.4356250000000006,
        "reward_min": -0.5099999999999996,
        "leartime_s": 0.009947237005690113,
        "sampletime": 11.721590403001755,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 2600000,
        "reward_mean": 0.5449500000000006,
        "reward_max": 1.4325000000000006,
        "reward_min": -0.5643749999999994,
        "leartime_s": 0.010151999013032764,
        "sampletime": 11.83149197101011,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 2620000,
        "reward_mean": 0.7884250000000006,
        "reward_max": 1.7281250000000004,
        "reward_min": -0.4568749999999998,
        "leartime_s": 0.007773701014230028,
        "sampletime": 11.255287189997034,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 2640000,
        "reward_mean": 0.3587250000000007,
        "reward_max": 1.1987500000000004,
        "reward_min": -1.3812499999999992,
        "leartime_s": 0.02943002901156433,
        "sampletime": 11.098681200004648,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 2660000,
        "reward_mean": 0.7272000000000006,
        "reward_max": 1.8875000000000008,
        "reward_min": -0.8093749999999994,
        "leartime_s": 0.0294121990154963,
        "sampletime": 11.869676903996151,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 2680000,
        "reward_mean": 0.46147500000000063,
        "reward_max": 1.4556250000000006,
        "reward_min": -0.3731249999999996,
        "leartime_s": 0.025813801010372117,
        "sampletime": 11.146239499998046,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 2700000,
        "reward_mean": 0.9619250000000006,
        "reward_max": 1.965,
        "reward_min": -0.05249999999999942,
        "leartime_s": 0.009458784013986588,
        "sampletime": 12.055992965993937,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 2720000,
        "reward_mean": 0.9829000000000006,
        "reward_max": 2.1750000000000007,
        "reward_min": -0.10562499999999936,
        "leartime_s": 0.01028682998730801,
        "sampletime": 11.483023312990554,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 2740000,
        "reward_mean": 0.9382500000000007,
        "reward_max": 1.8687500000000008,
        "reward_min": -0.4493749999999995,
        "leartime_s": 0.010532301996136084,
        "sampletime": 11.987655851000454,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 2760000,
        "reward_mean": 0.7179250000000006,
        "reward_max": 1.5681250000000009,
        "reward_min": -0.39812499999999945,
        "leartime_s": 0.030626679013948888,
        "sampletime": 12.036908626003424,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 2780000,
        "reward_mean": 0.5511250000000006,
        "reward_max": 1.350000000000001,
        "reward_min": -0.7949999999999993,
        "leartime_s": 0.011750892008421943,
        "sampletime": 11.361866054008715,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 2800000,
        "reward_mean": 0.6805250000000007,
        "reward_max": 1.495,
        "reward_min": -0.1818749999999995,
        "leartime_s": 0.02665337800863199,
        "sampletime": 11.888653203990543,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 2820000,
        "reward_mean": 0.6349250000000006,
        "reward_max": 2.020625000000001,
        "reward_min": -0.4987499999999991,
        "leartime_s": 0.00996018701698631,
        "sampletime": 11.439061615994433,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 2840000,
        "reward_mean": 0.8103750000000008,
        "reward_max": 1.847500000000001,
        "reward_min": -0.36812499999999987,
        "leartime_s": 0.01323183299973607,
        "sampletime": 11.797653365996666,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 2860000,
        "reward_mean": 0.9016250000000007,
        "reward_max": 1.8362500000000008,
        "reward_min": -0.7662499999999993,
        "leartime_s": 0.02720335201593116,
        "sampletime": 11.815184553997824,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 2880000,
        "reward_mean": 0.6335000000000007,
        "reward_max": 1.6025000000000005,
        "reward_min": -0.3987499999999997,
        "leartime_s": 0.014378142019268125,
        "sampletime": 11.867662061995361,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 2900000,
        "reward_mean": 0.7356500000000006,
        "reward_max": 2.1900000000000004,
        "reward_min": -0.5949999999999995,
        "leartime_s": 0.011252877011429518,
        "sampletime": 11.843961789010791,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 2920000,
        "reward_mean": 0.8217250000000006,
        "reward_max": 2.0631250000000003,
        "reward_min": -1.1724999999999997,
        "leartime_s": 0.010526241996558383,
        "sampletime": 12.008243641990703,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 2940000,
        "reward_mean": 0.5361250000000006,
        "reward_max": 1.6268750000000005,
        "reward_min": -1.3606249999999995,
        "leartime_s": 0.05593758498434909,
        "sampletime": 11.949351405986818,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 2960000,
        "reward_mean": 0.8789250000000005,
        "reward_max": 1.950000000000001,
        "reward_min": -0.24374999999999977,
        "leartime_s": 0.009900806995574385,
        "sampletime": 12.136858313024277,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 2980000,
        "reward_mean": 0.9453250000000005,
        "reward_max": 2.121875,
        "reward_min": -0.20312499999999958,
        "leartime_s": 0.024678832007339224,
        "sampletime": 11.83442163001746,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 3000000,
        "reward_mean": 0.9746000000000007,
        "reward_max": 1.8850000000000005,
        "reward_min": -0.4443749999999999,
        "leartime_s": 0.01038100098958239,
        "sampletime": 11.706586596992565,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 3020000,
        "reward_mean": 0.7978250000000007,
        "reward_max": 1.713750000000001,
        "reward_min": -0.790625,
        "leartime_s": 0.044254454027395695,
        "sampletime": 11.896899321000092,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 3040000,
        "reward_mean": 0.8789000000000007,
        "reward_max": 1.8450000000000006,
        "reward_min": -0.20124999999999965,
        "leartime_s": 0.04702324199024588,
        "sampletime": 12.037230190995615,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 3060000,
        "reward_mean": 1.2026750000000006,
        "reward_max": 2.2225000000000006,
        "reward_min": -0.7925000000000002,
        "leartime_s": 0.03108756200526841,
        "sampletime": 11.763929294975242,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 3080000,
        "reward_mean": 1.0338250000000007,
        "reward_max": 2.0593750000000006,
        "reward_min": 0.058125000000000746,
        "leartime_s": 0.07800701301312074,
        "sampletime": 11.7078475849994,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 3100000,
        "reward_mean": 1.0613500000000007,
        "reward_max": 2.203125,
        "reward_min": 0.16937500000000083,
        "leartime_s": 0.04129142197780311,
        "sampletime": 11.3631311969948,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 3120000,
        "reward_mean": 0.9527750000000007,
        "reward_max": 1.9287500000000006,
        "reward_min": -0.30187500000000006,
        "leartime_s": 0.029078305989969522,
        "sampletime": 11.92277162897517,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 3140000,
        "reward_mean": 0.9587000000000007,
        "reward_max": 1.9525000000000006,
        "reward_min": 0.0175000000000003,
        "leartime_s": 0.01807233100407757,
        "sampletime": 11.856221917987568,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 3160000,
        "reward_mean": 0.6191500000000005,
        "reward_max": 1.6212500000000005,
        "reward_min": -0.7725,
        "leartime_s": 0.012547506979899481,
        "sampletime": 11.274452331999782,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 3180000,
        "reward_mean": 1.0222500000000008,
        "reward_max": 2.031250000000001,
        "reward_min": -0.034999999999999865,
        "leartime_s": 0.058633095992263407,
        "sampletime": 11.910175626020646,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 3200000,
        "reward_mean": 0.6983250000000006,
        "reward_max": 1.7006250000000003,
        "reward_min": -0.2849999999999995,
        "leartime_s": 0.024699973000679165,
        "sampletime": 11.630553419003263,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 3220000,
        "reward_mean": 1.1153500000000007,
        "reward_max": 2.0656250000000007,
        "reward_min": 0.12000000000000044,
        "leartime_s": 0.025393107993295416,
        "sampletime": 10.700987625023117,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 3240000,
        "reward_mean": 0.6959250000000007,
        "reward_max": 1.5718750000000004,
        "reward_min": -0.5556249999999998,
        "leartime_s": 0.03013493400067091,
        "sampletime": 9.541330616979394,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 3260000,
        "reward_mean": 1.1047500000000006,
        "reward_max": 2.1318750000000004,
        "reward_min": -0.16249999999999964,
        "leartime_s": 0.02247916502528824,
        "sampletime": 9.566071966022719,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 3280000,
        "reward_mean": 1.1259500000000005,
        "reward_max": 2.215,
        "reward_min": 0.025625000000000342,
        "leartime_s": 0.01131267799064517,
        "sampletime": 9.84489159900113,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 3300000,
        "reward_mean": 1.0418000000000007,
        "reward_max": 2.028125000000001,
        "reward_min": -0.25624999999999953,
        "leartime_s": 0.01051145201199688,
        "sampletime": 9.765761223010486,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 3320000,
        "reward_mean": 1.0332250000000007,
        "reward_max": 2.155625000000001,
        "reward_min": -0.031249999999999306,
        "leartime_s": 0.011653231020318344,
        "sampletime": 11.035974425991299,
        "best_mean": 1.3088000000000006,
        "best_max": 2.545000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 3340000,
        "reward_mean": 1.3854000000000009,
        "reward_max": 2.5818750000000015,
        "reward_min": 0.3400000000000006,
        "leartime_s": 0.02481585298664868,
        "sampletime": 11.824754121014848,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 3360000,
        "reward_mean": 0.8284000000000007,
        "reward_max": 2.1150000000000007,
        "reward_min": -1.0624999999999993,
        "leartime_s": 0.02374773198971525,
        "sampletime": 11.386108139005955,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 3380000,
        "reward_mean": 0.9316000000000006,
        "reward_max": 2.090000000000001,
        "reward_min": -0.11562499999999955,
        "leartime_s": 0.02315572099178098,
        "sampletime": 11.784657859010622,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 3400000,
        "reward_mean": 1.1000250000000005,
        "reward_max": 2.6468750000000005,
        "reward_min": -0.036875000000000074,
        "leartime_s": 0.01626127798226662,
        "sampletime": 11.720610249001766,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 3420000,
        "reward_mean": 1.1024500000000008,
        "reward_max": 2.3075000000000006,
        "reward_min": -0.056874999999999495,
        "leartime_s": 0.01936893700622022,
        "sampletime": 11.689036030991701,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 3440000,
        "reward_mean": 0.9695000000000006,
        "reward_max": 1.8675000000000006,
        "reward_min": 0.013750000000000567,
        "leartime_s": 0.02058402498369105,
        "sampletime": 11.607849861000432,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 3460000,
        "reward_mean": 1.0748000000000006,
        "reward_max": 2.2231250000000005,
        "reward_min": 0.1850000000000005,
        "leartime_s": 0.024717071995837614,
        "sampletime": 11.664564761013025,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 3480000,
        "reward_mean": 1.1647500000000008,
        "reward_max": 2.0712500000000005,
        "reward_min": -0.16375000000000028,
        "leartime_s": 0.02112123102415353,
        "sampletime": 11.383889082004316,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 3500000,
        "reward_mean": 1.2004500000000007,
        "reward_max": 2.10875,
        "reward_min": -0.23562499999999972,
        "leartime_s": 0.012901861016871408,
        "sampletime": 11.605016549990978,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 3520000,
        "reward_mean": 1.1058500000000004,
        "reward_max": 2.201250000000001,
        "reward_min": -0.3274999999999999,
        "leartime_s": 0.012502523983130231,
        "sampletime": 11.618243119999534,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 3540000,
        "reward_mean": 1.1399500000000005,
        "reward_max": 2.2543750000000005,
        "reward_min": -0.10062499999999969,
        "leartime_s": 0.011347503983415663,
        "sampletime": 11.276041212986456,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 3560000,
        "reward_mean": 1.1320000000000006,
        "reward_max": 2.1881250000000008,
        "reward_min": -0.038749999999999535,
        "leartime_s": 0.01339798397384584,
        "sampletime": 11.914629819017136,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 3580000,
        "reward_mean": 0.8935000000000006,
        "reward_max": 2.0250000000000012,
        "reward_min": -0.9387499999999993,
        "leartime_s": 0.014014229003805667,
        "sampletime": 11.186317544983467,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 3600000,
        "reward_mean": 1.2671750000000004,
        "reward_max": 2.615625,
        "reward_min": -0.016875000000000473,
        "leartime_s": 0.03505926500656642,
        "sampletime": 11.355647125979885,
        "best_mean": 1.3854000000000009,
        "best_max": 2.5818750000000015,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 3620000,
        "reward_mean": 1.3905250000000005,
        "reward_max": 2.5587500000000003,
        "reward_min": 0.32750000000000057,
        "leartime_s": 0.08719848102191463,
        "sampletime": 11.735879621992353,
        "best_mean": 1.3905250000000005,
        "best_max": 2.5587500000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 3640000,
        "reward_mean": 1.5076500000000008,
        "reward_max": 2.7575000000000003,
        "reward_min": 0.4106250000000011,
        "leartime_s": 0.05371739101246931,
        "sampletime": 11.637047587020788,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 3660000,
        "reward_mean": 1.0182250000000004,
        "reward_max": 2.1906250000000003,
        "reward_min": 0.018125000000000738,
        "leartime_s": 0.06402769600390457,
        "sampletime": 11.85032000602223,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 3680000,
        "reward_mean": 1.0771750000000007,
        "reward_max": 1.8743750000000003,
        "reward_min": 0.012500000000000289,
        "leartime_s": 0.019231279991799966,
        "sampletime": 11.488240976002999,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 3700000,
        "reward_mean": 1.1083000000000007,
        "reward_max": 2.1068750000000005,
        "reward_min": 0.09250000000000061,
        "leartime_s": 0.07943605299806222,
        "sampletime": 11.221660698007327,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 3720000,
        "reward_mean": 1.2407250000000005,
        "reward_max": 2.0900000000000003,
        "reward_min": 0.3462500000000007,
        "leartime_s": 0.012147942994488403,
        "sampletime": 11.91359444198315,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 3740000,
        "reward_mean": 1.1502000000000006,
        "reward_max": 2.3600000000000003,
        "reward_min": -0.1931250000000002,
        "leartime_s": 0.014827506005531177,
        "sampletime": 11.371182721020887,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 3760000,
        "reward_mean": 1.2858500000000008,
        "reward_max": 2.2693750000000006,
        "reward_min": 0.21375000000000016,
        "leartime_s": 0.013511083991033956,
        "sampletime": 11.302376879000803,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 3780000,
        "reward_mean": 1.3556000000000006,
        "reward_max": 2.2762500000000006,
        "reward_min": -0.07750000000000039,
        "leartime_s": 0.07355251000262797,
        "sampletime": 12.010344021982746,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 3800000,
        "reward_mean": 1.0489000000000008,
        "reward_max": 2.0331250000000005,
        "reward_min": -0.30624999999999913,
        "leartime_s": 0.08714192098705098,
        "sampletime": 10.818799861997832,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 3820000,
        "reward_mean": 1.0711500000000005,
        "reward_max": 2.2493750000000006,
        "reward_min": 0.02000000000000076,
        "leartime_s": 0.01641398502397351,
        "sampletime": 11.94205206699553,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 3840000,
        "reward_mean": 0.8703500000000006,
        "reward_max": 1.8025000000000004,
        "reward_min": -0.2656249999999999,
        "leartime_s": 0.050302085001021624,
        "sampletime": 11.239818856003694,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 3860000,
        "reward_mean": 1.0752750000000006,
        "reward_max": 1.9856250000000004,
        "reward_min": 0.010625000000000273,
        "leartime_s": 0.012673443998210132,
        "sampletime": 11.479054722993169,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 3880000,
        "reward_mean": 0.9301500000000007,
        "reward_max": 2.131250000000001,
        "reward_min": -0.10749999999999979,
        "leartime_s": 0.03508585799136199,
        "sampletime": 11.970982886996353,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 3900000,
        "reward_mean": 0.7883000000000007,
        "reward_max": 1.6800000000000004,
        "reward_min": 0.04062500000000041,
        "leartime_s": 0.058432121004443616,
        "sampletime": 11.284133742999984,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 3920000,
        "reward_mean": 0.9310750000000007,
        "reward_max": 1.7368750000000008,
        "reward_min": 0.11625000000000035,
        "leartime_s": 0.015766830008942634,
        "sampletime": 11.129030821000924,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 3940000,
        "reward_mean": 0.9658500000000005,
        "reward_max": 2.390625000000001,
        "reward_min": -0.4418749999999998,
        "leartime_s": 0.011860687984153628,
        "sampletime": 11.630268851993605,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 3960000,
        "reward_mean": 1.3768500000000006,
        "reward_max": 2.422500000000001,
        "reward_min": 0.36500000000000044,
        "leartime_s": 0.03512154897907749,
        "sampletime": 11.193039681995288,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 3980000,
        "reward_mean": 1.2748000000000006,
        "reward_max": 2.43875,
        "reward_min": 0.2037500000000005,
        "leartime_s": 0.05017647301428951,
        "sampletime": 11.821722911990946,
        "best_mean": 1.5076500000000008,
        "best_max": 2.7575000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 4000000,
        "reward_mean": 1.5118750000000007,
        "reward_max": 2.521875,
        "reward_min": 0.12000000000000102,
        "leartime_s": 0.018459729006281123,
        "sampletime": 11.44724243998644,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 4020000,
        "reward_mean": 1.0262500000000006,
        "reward_max": 2.258750000000001,
        "reward_min": -0.19624999999999962,
        "leartime_s": 0.03073237300850451,
        "sampletime": 11.006498298986116,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 4040000,
        "reward_mean": 1.0887750000000005,
        "reward_max": 2.2806250000000006,
        "reward_min": -0.09874999999999926,
        "leartime_s": 0.04204768597264774,
        "sampletime": 11.998248874995625,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 4060000,
        "reward_mean": 1.1432750000000005,
        "reward_max": 2.2343750000000004,
        "reward_min": 0.22437500000000019,
        "leartime_s": 0.03543823701329529,
        "sampletime": 11.661594420002075,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 4080000,
        "reward_mean": 0.8687500000000006,
        "reward_max": 1.8331250000000003,
        "reward_min": -0.24749999999999994,
        "leartime_s": 0.025266787997679785,
        "sampletime": 10.387056583014783,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 4100000,
        "reward_mean": 1.0349000000000008,
        "reward_max": 2.2150000000000007,
        "reward_min": -0.2081249999999995,
        "leartime_s": 0.07446960799279623,
        "sampletime": 8.65111019500182,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 4120000,
        "reward_mean": 0.9649250000000006,
        "reward_max": 2.0125000000000006,
        "reward_min": -0.4343749999999997,
        "leartime_s": 0.026023623999208212,
        "sampletime": 8.676655037008459,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 4140000,
        "reward_mean": 1.1240250000000005,
        "reward_max": 2.0187500000000007,
        "reward_min": -0.3893749999999998,
        "leartime_s": 0.012068064999766648,
        "sampletime": 9.159777046996169,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 4160000,
        "reward_mean": 0.3832500000000007,
        "reward_max": 1.4575000000000002,
        "reward_min": -1.0843749999999985,
        "leartime_s": 0.012901015987154096,
        "sampletime": 9.334239740972407,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 4180000,
        "reward_mean": 1.2041000000000006,
        "reward_max": 2.1393750000000007,
        "reward_min": 0.3081250000000007,
        "leartime_s": 0.02221931901294738,
        "sampletime": 9.18131999799516,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 4200000,
        "reward_mean": 0.7723750000000007,
        "reward_max": 1.9375000000000007,
        "reward_min": -0.6368749999999991,
        "leartime_s": 0.034288157999981195,
        "sampletime": 8.91594289400382,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 4220000,
        "reward_mean": 1.3714000000000006,
        "reward_max": 2.4793750000000006,
        "reward_min": 0.03875000000000044,
        "leartime_s": 0.0323124110000208,
        "sampletime": 8.822405048995279,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 4240000,
        "reward_mean": 0.9845000000000005,
        "reward_max": 1.987500000000001,
        "reward_min": -0.04312499999999937,
        "leartime_s": 0.012616560998139903,
        "sampletime": 8.939068040024722,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 4260000,
        "reward_mean": 0.8307750000000007,
        "reward_max": 1.7368750000000008,
        "reward_min": -0.4406249999999996,
        "leartime_s": 0.013013877003686503,
        "sampletime": 8.777299743989715,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 4280000,
        "reward_mean": 0.7487500000000007,
        "reward_max": 1.8968750000000008,
        "reward_min": -0.713749999999999,
        "leartime_s": 0.028937022987520322,
        "sampletime": 9.066922809986863,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 4300000,
        "reward_mean": 0.9907500000000006,
        "reward_max": 2.091875000000001,
        "reward_min": -0.7187500000000004,
        "leartime_s": 0.012448978988686576,
        "sampletime": 9.22605521400692,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 4320000,
        "reward_mean": 1.2054250000000006,
        "reward_max": 2.2031250000000004,
        "reward_min": -0.01812499999999937,
        "leartime_s": 0.020123175985645503,
        "sampletime": 8.821313103981083,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 4340000,
        "reward_mean": 1.2357500000000003,
        "reward_max": 2.468125,
        "reward_min": 0.050000000000000266,
        "leartime_s": 0.013827380986185744,
        "sampletime": 9.414971985999728,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 4360000,
        "reward_mean": 0.6680500000000006,
        "reward_max": 1.7268750000000008,
        "reward_min": -1.3531250000000001,
        "leartime_s": 0.012463572027627379,
        "sampletime": 9.205697618977865,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 4380000,
        "reward_mean": 0.8673500000000006,
        "reward_max": 1.6693750000000007,
        "reward_min": -0.16312499999999933,
        "leartime_s": 0.014697159989736974,
        "sampletime": 9.35133380201296,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 4400000,
        "reward_mean": 1.1900750000000007,
        "reward_max": 2.4400000000000004,
        "reward_min": 0.08250000000000035,
        "leartime_s": 0.03378196302219294,
        "sampletime": 8.980517817981308,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 4420000,
        "reward_mean": 1.0687750000000005,
        "reward_max": 2.1812500000000004,
        "reward_min": -0.17562499999999967,
        "leartime_s": 0.01426968298619613,
        "sampletime": 8.90545162401395,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 4440000,
        "reward_mean": 0.8015500000000007,
        "reward_max": 1.7337500000000008,
        "reward_min": -0.2587499999999994,
        "leartime_s": 0.01686689499183558,
        "sampletime": 10.643518728000345,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 4460000,
        "reward_mean": 1.0295500000000004,
        "reward_max": 2.263750000000001,
        "reward_min": -0.8800000000000001,
        "leartime_s": 0.03222858000663109,
        "sampletime": 10.301308026973857,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 4480000,
        "reward_mean": 0.7395000000000007,
        "reward_max": 1.5518750000000008,
        "reward_min": -0.26374999999999915,
        "leartime_s": 0.01990818901685998,
        "sampletime": 11.963584584998898,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 4500000,
        "reward_mean": 1.0314500000000006,
        "reward_max": 2.32625,
        "reward_min": -0.20624999999999932,
        "leartime_s": 0.013344348000828177,
        "sampletime": 11.51974342498579,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 4520000,
        "reward_mean": 0.9864750000000005,
        "reward_max": 2.0356250000000005,
        "reward_min": -0.3275000000000001,
        "leartime_s": 0.03322806899086572,
        "sampletime": 11.141083040012745,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 4540000,
        "reward_mean": 1.0495250000000005,
        "reward_max": 2.2225000000000006,
        "reward_min": -0.008749999999999772,
        "leartime_s": 0.013401580014033243,
        "sampletime": 11.74735899400548,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 4560000,
        "reward_mean": 1.0685000000000007,
        "reward_max": 1.9381250000000003,
        "reward_min": 0.28625000000000034,
        "leartime_s": 0.019105612998828292,
        "sampletime": 11.138739257992711,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 4580000,
        "reward_mean": 0.7849000000000008,
        "reward_max": 2.1993750000000007,
        "reward_min": -1.313124999999998,
        "leartime_s": 0.053701880999142304,
        "sampletime": 11.86782572400989,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 4600000,
        "reward_mean": 1.0365250000000006,
        "reward_max": 2.308125,
        "reward_min": -0.8425000000000001,
        "leartime_s": 0.023172943998361006,
        "sampletime": 11.794136924989289,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 4620000,
        "reward_mean": 1.0299750000000008,
        "reward_max": 2.0675000000000003,
        "reward_min": -0.41062499999999913,
        "leartime_s": 0.015225745999487117,
        "sampletime": 11.338130479998654,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 4640000,
        "reward_mean": 0.8502750000000006,
        "reward_max": 1.9687500000000004,
        "reward_min": -0.7368749999999998,
        "leartime_s": 0.011761424015276134,
        "sampletime": 11.70475306501612,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 4660000,
        "reward_mean": 0.6697000000000006,
        "reward_max": 1.6206250000000004,
        "reward_min": -0.7706250000000001,
        "leartime_s": 0.034720808995189145,
        "sampletime": 11.649859694007318,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 4680000,
        "reward_mean": 0.6682250000000006,
        "reward_max": 1.6600000000000008,
        "reward_min": -0.48437499999999994,
        "leartime_s": 0.017716492002364248,
        "sampletime": 11.618084349989658,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 4700000,
        "reward_mean": 0.8646500000000008,
        "reward_max": 2.0925000000000007,
        "reward_min": -0.24124999999999958,
        "leartime_s": 0.047991026018280536,
        "sampletime": 11.756979286001297,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 4720000,
        "reward_mean": 0.7801250000000007,
        "reward_max": 1.8725000000000007,
        "reward_min": -0.8606249999999998,
        "leartime_s": 0.015288943017367274,
        "sampletime": 11.866653175995452,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 4740000,
        "reward_mean": 0.7469250000000007,
        "reward_max": 2.1543750000000004,
        "reward_min": -1.4306249999999991,
        "leartime_s": 0.014769626985071227,
        "sampletime": 11.835189947014442,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 4760000,
        "reward_mean": 0.8546250000000004,
        "reward_max": 2.3043750000000007,
        "reward_min": -0.6562500000000001,
        "leartime_s": 0.013729019003221765,
        "sampletime": 11.47367962100543,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 4780000,
        "reward_mean": 0.7819500000000005,
        "reward_max": 1.7843750000000007,
        "reward_min": -1.0137500000000006,
        "leartime_s": 0.01812068501021713,
        "sampletime": 11.40146494199871,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 4800000,
        "reward_mean": 0.7750000000000006,
        "reward_max": 1.8793750000000007,
        "reward_min": -0.5106249999999992,
        "leartime_s": 0.03898225899320096,
        "sampletime": 11.772789226000896,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 4820000,
        "reward_mean": 1.0045250000000006,
        "reward_max": 2.0287500000000005,
        "reward_min": -0.4568749999999995,
        "leartime_s": 0.017446290992666036,
        "sampletime": 11.298812778026331,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 4840000,
        "reward_mean": 1.0587250000000006,
        "reward_max": 2.145625000000001,
        "reward_min": -0.2931249999999994,
        "leartime_s": 0.014894369000103325,
        "sampletime": 11.552789766981732,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 4860000,
        "reward_mean": 1.0888000000000007,
        "reward_max": 1.9587500000000007,
        "reward_min": 0.23687500000000045,
        "leartime_s": 0.013973452994832769,
        "sampletime": 12.087849219009513,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 4880000,
        "reward_mean": 1.1255250000000006,
        "reward_max": 2.43625,
        "reward_min": -0.03499999999999928,
        "leartime_s": 0.01575985600356944,
        "sampletime": 11.654395916993963,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 4900000,
        "reward_mean": 1.0245250000000006,
        "reward_max": 2.155000000000001,
        "reward_min": -0.3468749999999997,
        "leartime_s": 0.023742029996355996,
        "sampletime": 11.351902688998962,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 4920000,
        "reward_mean": 0.9308000000000006,
        "reward_max": 1.861875000000001,
        "reward_min": -0.26874999999999916,
        "leartime_s": 0.03852225802256726,
        "sampletime": 11.816605627012905,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 4940000,
        "reward_mean": 0.8405750000000007,
        "reward_max": 2.147500000000001,
        "reward_min": -0.8493749999999993,
        "leartime_s": 0.05453228502301499,
        "sampletime": 11.78081900300458,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 4960000,
        "reward_mean": 1.3591000000000006,
        "reward_max": 2.6387500000000004,
        "reward_min": -0.06437499999999946,
        "leartime_s": 0.055436333001125604,
        "sampletime": 11.602654090005672,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 4980000,
        "reward_mean": 0.7128500000000005,
        "reward_max": 1.9025000000000005,
        "reward_min": -0.8462499999999997,
        "leartime_s": 0.014262943004723638,
        "sampletime": 11.813766467006644,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 5000000,
        "reward_mean": 0.6306000000000006,
        "reward_max": 1.4918750000000012,
        "reward_min": -0.9293749999999994,
        "leartime_s": 0.029104971006745473,
        "sampletime": 12.109639732982032,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 5020000,
        "reward_mean": 0.7781250000000006,
        "reward_max": 1.9212500000000006,
        "reward_min": -0.6431249999999992,
        "leartime_s": 0.01927359399269335,
        "sampletime": 11.561557080014609,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 5040000,
        "reward_mean": 0.4604250000000006,
        "reward_max": 1.601250000000001,
        "reward_min": -1.1131250000000001,
        "leartime_s": 0.08449157100403681,
        "sampletime": 11.769514712010277,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 5060000,
        "reward_mean": 0.9010750000000005,
        "reward_max": 1.8212500000000003,
        "reward_min": -0.9287499999999994,
        "leartime_s": 0.04454280500067398,
        "sampletime": 11.66842668299796,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 5080000,
        "reward_mean": 0.7929750000000005,
        "reward_max": 2.318750000000001,
        "reward_min": -0.7712499999999999,
        "leartime_s": 0.02745738800149411,
        "sampletime": 11.764682060020277,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 5100000,
        "reward_mean": 0.7304000000000005,
        "reward_max": 2.06625,
        "reward_min": -1.5824999999999994,
        "leartime_s": 0.015233932004775852,
        "sampletime": 11.337944819009863,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 5120000,
        "reward_mean": 0.7019750000000006,
        "reward_max": 1.9993750000000003,
        "reward_min": -0.6512499999999994,
        "leartime_s": 0.02129181899363175,
        "sampletime": 11.233313267992344,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 5140000,
        "reward_mean": 1.0706000000000007,
        "reward_max": 2.1106250000000006,
        "reward_min": -0.379375,
        "leartime_s": 0.015631485992344096,
        "sampletime": 11.91789212700678,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 5160000,
        "reward_mean": 0.7847250000000007,
        "reward_max": 1.6362500000000009,
        "reward_min": -0.6224999999999999,
        "leartime_s": 0.0183289650012739,
        "sampletime": 11.701309608994052,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 5180000,
        "reward_mean": 0.8160000000000007,
        "reward_max": 1.8668750000000005,
        "reward_min": -0.35562499999999936,
        "leartime_s": 0.0479537210194394,
        "sampletime": 11.396779684990179,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 5200000,
        "reward_mean": 0.8679000000000008,
        "reward_max": 1.9093750000000007,
        "reward_min": -1.0168749999999998,
        "leartime_s": 0.019164030003594235,
        "sampletime": 11.799881378014106,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 5220000,
        "reward_mean": 0.6224000000000003,
        "reward_max": 2.2000000000000006,
        "reward_min": -1.0137500000000002,
        "leartime_s": 0.05690631098696031,
        "sampletime": 12.337838913983433,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 5240000,
        "reward_mean": 0.7015500000000007,
        "reward_max": 2.2243750000000007,
        "reward_min": -0.8037499999999993,
        "leartime_s": 0.02911521101486869,
        "sampletime": 11.276957606023643,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 5260000,
        "reward_mean": 0.5498500000000006,
        "reward_max": 1.7337500000000008,
        "reward_min": -1.506875,
        "leartime_s": 0.03581385497818701,
        "sampletime": 12.221205134992488,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 5280000,
        "reward_mean": 0.8147500000000006,
        "reward_max": 1.9631250000000011,
        "reward_min": -0.63,
        "leartime_s": 0.017784713010769337,
        "sampletime": 11.52738265201333,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 5300000,
        "reward_mean": 1.0371500000000005,
        "reward_max": 2.0662500000000006,
        "reward_min": -0.925624999999999,
        "leartime_s": 0.03351695599849336,
        "sampletime": 11.210265684989281,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 5320000,
        "reward_mean": 0.5567750000000006,
        "reward_max": 1.6125000000000007,
        "reward_min": -1.7437500000000012,
        "leartime_s": 0.018188513990025967,
        "sampletime": 12.107558040006552,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 5340000,
        "reward_mean": 0.4366250000000006,
        "reward_max": 1.5381250000000009,
        "reward_min": -1.3124999999999996,
        "leartime_s": 0.03711875301087275,
        "sampletime": 11.607825701998081,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 5360000,
        "reward_mean": 0.7389500000000007,
        "reward_max": 1.9312500000000008,
        "reward_min": -0.7874999999999999,
        "leartime_s": 0.03829380200477317,
        "sampletime": 11.679054959997302,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 5380000,
        "reward_mean": 0.7059750000000007,
        "reward_max": 1.8518750000000006,
        "reward_min": -0.3318749999999995,
        "leartime_s": 0.017454428976634517,
        "sampletime": 11.49433627599501,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 5400000,
        "reward_mean": 0.7951000000000006,
        "reward_max": 2.2856250000000005,
        "reward_min": -1.2850000000000001,
        "leartime_s": 0.018631165992701426,
        "sampletime": 11.640745284996228,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 5420000,
        "reward_mean": 0.8136750000000006,
        "reward_max": 2.190000000000001,
        "reward_min": -0.5999999999999999,
        "leartime_s": 0.020170640986179933,
        "sampletime": 11.694964091002475,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 5440000,
        "reward_mean": 0.42727500000000057,
        "reward_max": 2.2406250000000005,
        "reward_min": -1.7774999999999996,
        "leartime_s": 0.012845470977481455,
        "sampletime": 11.723564178013476,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 5460000,
        "reward_mean": 1.1048500000000003,
        "reward_max": 2.0612500000000002,
        "reward_min": -0.08249999999999982,
        "leartime_s": 0.015444721007952467,
        "sampletime": 11.582687315007206,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 5480000,
        "reward_mean": 0.9092750000000005,
        "reward_max": 2.1881250000000008,
        "reward_min": -1.543125,
        "leartime_s": 0.023611676006112248,
        "sampletime": 11.562910537992138,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 5500000,
        "reward_mean": 0.7137500000000006,
        "reward_max": 1.8381250000000007,
        "reward_min": -2.174375000000001,
        "leartime_s": 0.018505768006434664,
        "sampletime": 12.016803665988846,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 5520000,
        "reward_mean": 1.2609750000000008,
        "reward_max": 2.3306250000000004,
        "reward_min": -0.11249999999999914,
        "leartime_s": 0.06259179199696518,
        "sampletime": 11.278012619004585,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 5540000,
        "reward_mean": 0.8386500000000006,
        "reward_max": 2.4762500000000003,
        "reward_min": -1.19875,
        "leartime_s": 0.028309184999670833,
        "sampletime": 11.448375375999603,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 5560000,
        "reward_mean": 0.9000250000000006,
        "reward_max": 2.262500000000001,
        "reward_min": -0.26937499999999936,
        "leartime_s": 0.01581806701142341,
        "sampletime": 12.193828018003842,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 5580000,
        "reward_mean": 0.5682750000000008,
        "reward_max": 1.4300000000000008,
        "reward_min": -0.5468749999999992,
        "leartime_s": 0.04133522600750439,
        "sampletime": 11.542336774989963,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 5600000,
        "reward_mean": 0.7021250000000007,
        "reward_max": 1.6775000000000007,
        "reward_min": -0.6318749999999994,
        "leartime_s": 0.015291818999685347,
        "sampletime": 12.067092338984367,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 5620000,
        "reward_mean": 0.8493250000000008,
        "reward_max": 2.0518750000000003,
        "reward_min": -0.82125,
        "leartime_s": 0.01850018900586292,
        "sampletime": 11.869027916982304,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 5640000,
        "reward_mean": 0.7973500000000006,
        "reward_max": 1.8325000000000007,
        "reward_min": -1.10625,
        "leartime_s": 0.019649338006274775,
        "sampletime": 11.14708745200187,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 5660000,
        "reward_mean": 0.6002000000000005,
        "reward_max": 1.7262500000000012,
        "reward_min": -1.1943749999999995,
        "leartime_s": 0.020950756006641313,
        "sampletime": 12.025874645012664,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 5680000,
        "reward_mean": 1.2053750000000005,
        "reward_max": 2.4531250000000004,
        "reward_min": -0.5162499999999998,
        "leartime_s": 0.06788460299139842,
        "sampletime": 11.615281558973948,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 5700000,
        "reward_mean": 0.6576250000000007,
        "reward_max": 1.7756250000000011,
        "reward_min": -0.7212499999999997,
        "leartime_s": 0.015417172980960459,
        "sampletime": 11.599106453999411,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 5720000,
        "reward_mean": 0.9055750000000005,
        "reward_max": 1.8631250000000004,
        "reward_min": -1.5512499999999994,
        "leartime_s": 0.016778175020590425,
        "sampletime": 11.557062798994593,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 5740000,
        "reward_mean": 0.8755750000000008,
        "reward_max": 2.1137500000000005,
        "reward_min": -1.031875,
        "leartime_s": 0.04239762498764321,
        "sampletime": 11.850704957993003,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 5760000,
        "reward_mean": 0.5996500000000006,
        "reward_max": 1.8775000000000004,
        "reward_min": -0.8399999999999993,
        "leartime_s": 0.06208971200976521,
        "sampletime": 11.544257288012886,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 5780000,
        "reward_mean": 0.8419750000000007,
        "reward_max": 1.8681250000000007,
        "reward_min": -0.47249999999999936,
        "leartime_s": 0.016731220996007323,
        "sampletime": 11.834504144993844,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 5800000,
        "reward_mean": 0.8809250000000006,
        "reward_max": 1.7575000000000005,
        "reward_min": -0.7793750000000002,
        "leartime_s": 0.02968183602206409,
        "sampletime": 11.32239516300615,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 5820000,
        "reward_mean": 1.0738250000000005,
        "reward_max": 2.073750000000001,
        "reward_min": -0.024374999999999133,
        "leartime_s": 0.055567817005794495,
        "sampletime": 11.789812745992094,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 5840000,
        "reward_mean": 1.0705500000000006,
        "reward_max": 1.960000000000001,
        "reward_min": 0.12000000000000063,
        "leartime_s": 0.04268024300108664,
        "sampletime": 11.67788486299105,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 5860000,
        "reward_mean": 0.8669750000000006,
        "reward_max": 2.0725000000000002,
        "reward_min": -0.3599999999999996,
        "leartime_s": 0.02197593101300299,
        "sampletime": 11.389520513999742,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 5880000,
        "reward_mean": 0.8042000000000006,
        "reward_max": 1.9125000000000005,
        "reward_min": -0.4056249999999993,
        "leartime_s": 0.078726771986112,
        "sampletime": 11.37342319599702,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 5900000,
        "reward_mean": 0.8531000000000006,
        "reward_max": 1.9218750000000004,
        "reward_min": -1.3149999999999995,
        "leartime_s": 0.0873191189893987,
        "sampletime": 12.176074635994155,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 5920000,
        "reward_mean": 0.8095000000000007,
        "reward_max": 1.6718750000000009,
        "reward_min": -0.31374999999999953,
        "leartime_s": 0.04044465802144259,
        "sampletime": 11.231946565996623,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 5940000,
        "reward_mean": 1.0463750000000005,
        "reward_max": 1.7543750000000002,
        "reward_min": 0.03625000000000045,
        "leartime_s": 0.053636063006706536,
        "sampletime": 11.883683020016178,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 5960000,
        "reward_mean": 0.9466500000000005,
        "reward_max": 1.9437500000000005,
        "reward_min": 0.049375000000000134,
        "leartime_s": 0.05949756799964234,
        "sampletime": 11.011247627000557,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 5980000,
        "reward_mean": 1.0992250000000006,
        "reward_max": 2.0812500000000003,
        "reward_min": -0.196875,
        "leartime_s": 0.027706369990482926,
        "sampletime": 11.729151770996395,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 6000000,
        "reward_mean": 1.1614000000000007,
        "reward_max": 2.1412500000000003,
        "reward_min": -0.07812499999999925,
        "leartime_s": 0.042169029999058694,
        "sampletime": 11.65786417099298,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 6020000,
        "reward_mean": 0.8448500000000005,
        "reward_max": 1.6456250000000008,
        "reward_min": -0.2843749999999995,
        "leartime_s": 0.049558090016944334,
        "sampletime": 11.244657114992151,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 6040000,
        "reward_mean": 1.0829500000000007,
        "reward_max": 1.9968750000000006,
        "reward_min": 0.13625000000000065,
        "leartime_s": 0.043561200000112876,
        "sampletime": 9.542600780987414,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 6060000,
        "reward_mean": 0.9580405000000006,
        "reward_max": 2.066250000000001,
        "reward_min": -0.6025000000000001,
        "leartime_s": 0.03964819299289957,
        "sampletime": 9.42779512697598,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 6080000,
        "reward_mean": 0.9250500000000006,
        "reward_max": 1.8068750000000005,
        "reward_min": 0.08375000000000056,
        "leartime_s": 0.03146031900541857,
        "sampletime": 9.80004815099528,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 6100000,
        "reward_mean": 0.9621750000000007,
        "reward_max": 1.6393750000000005,
        "reward_min": 0.19812500000000122,
        "leartime_s": 0.01597755801049061,
        "sampletime": 9.384747987001901,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 6120000,
        "reward_mean": 0.8496750000000007,
        "reward_max": 2.0281250000000006,
        "reward_min": -0.06499999999999927,
        "leartime_s": 0.03286067600129172,
        "sampletime": 9.667280015011784,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 6140000,
        "reward_mean": 1.0026750000000006,
        "reward_max": 1.8643750000000006,
        "reward_min": 0.1643750000000005,
        "leartime_s": 0.033420894003938884,
        "sampletime": 8.765485690993955,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 6160000,
        "reward_mean": 1.0090500000000004,
        "reward_max": 2.4212500000000006,
        "reward_min": -0.6287499999999998,
        "leartime_s": 0.015910374000668526,
        "sampletime": 7.960675189999165,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 6180000,
        "reward_mean": 0.9592500000000007,
        "reward_max": 2.0493750000000004,
        "reward_min": -0.5249999999999994,
        "leartime_s": 0.0158733940043021,
        "sampletime": 7.710794505983358,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 6200000,
        "reward_mean": 1.3137500000000006,
        "reward_max": 2.3525,
        "reward_min": 0.508125000000001,
        "leartime_s": 0.031416095996974036,
        "sampletime": 7.692608558980282,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 6220000,
        "reward_mean": 1.0115750000000008,
        "reward_max": 1.8331250000000008,
        "reward_min": -0.16187499999999955,
        "leartime_s": 0.019708547013578936,
        "sampletime": 7.654118123988155,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 6240000,
        "reward_mean": 0.9158000000000006,
        "reward_max": 1.8500000000000008,
        "reward_min": -0.2524999999999995,
        "leartime_s": 0.019335841003339738,
        "sampletime": 7.844617214985192,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 6260000,
        "reward_mean": 0.9421250000000007,
        "reward_max": 2.0881250000000007,
        "reward_min": -0.5368749999999991,
        "leartime_s": 0.016189761023269966,
        "sampletime": 7.676646129984874,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 6280000,
        "reward_mean": 0.9516250000000007,
        "reward_max": 2.006250000000001,
        "reward_min": 0.06687500000000057,
        "leartime_s": 0.017248384014237672,
        "sampletime": 7.964320872008102,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 6300000,
        "reward_mean": 0.9275500000000008,
        "reward_max": 1.7112500000000002,
        "reward_min": 0.07437500000000015,
        "leartime_s": 0.016228591004619375,
        "sampletime": 7.747342299000593,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 6320000,
        "reward_mean": 1.2864500000000008,
        "reward_max": 2.276875000000001,
        "reward_min": 0.4143750000000008,
        "leartime_s": 0.0371338709956035,
        "sampletime": 7.903242433007108,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 6340000,
        "reward_mean": 0.9743500000000007,
        "reward_max": 1.9693750000000003,
        "reward_min": 0.030000000000000703,
        "leartime_s": 0.016226240986725315,
        "sampletime": 7.799369951011613,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 6360000,
        "reward_mean": 0.6783000000000007,
        "reward_max": 1.5462500000000008,
        "reward_min": -0.26687499999999953,
        "leartime_s": 0.019307149981614202,
        "sampletime": 7.855508692999138,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 6380000,
        "reward_mean": 1.0460500000000006,
        "reward_max": 2.070625,
        "reward_min": -0.09124999999999914,
        "leartime_s": 0.02529948699520901,
        "sampletime": 7.9005229430040345,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 6400000,
        "reward_mean": 0.7859750000000009,
        "reward_max": 1.6575000000000002,
        "reward_min": -0.07624999999999954,
        "leartime_s": 0.01918333998764865,
        "sampletime": 7.7348205049929675,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 6420000,
        "reward_mean": 0.8316000000000007,
        "reward_max": 1.6412500000000008,
        "reward_min": 0.05375000000000036,
        "leartime_s": 0.016992343007586896,
        "sampletime": 7.894556998013286,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 6440000,
        "reward_mean": 1.2082750000000009,
        "reward_max": 2.1006250000000004,
        "reward_min": 0.46562500000000046,
        "leartime_s": 0.0382711999991443,
        "sampletime": 8.614035228005378,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 6460000,
        "reward_mean": 0.9803000000000006,
        "reward_max": 1.8175000000000003,
        "reward_min": -0.2999999999999988,
        "leartime_s": 0.04420369802392088,
        "sampletime": 9.214847244002158,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 6480000,
        "reward_mean": 0.8594500000000007,
        "reward_max": 1.8050000000000008,
        "reward_min": 0.09437500000000076,
        "leartime_s": 0.022870502987643704,
        "sampletime": 9.0642631080118,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 6500000,
        "reward_mean": 0.8062000000000007,
        "reward_max": 1.7531250000000005,
        "reward_min": -0.23624999999999968,
        "leartime_s": 0.016442688007373363,
        "sampletime": 8.804450723982882,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 6520000,
        "reward_mean": 1.0943000000000007,
        "reward_max": 1.9175000000000004,
        "reward_min": 0.33812500000000023,
        "leartime_s": 0.03820579100283794,
        "sampletime": 8.858271311008139,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 6540000,
        "reward_mean": 0.8702500000000006,
        "reward_max": 1.8368750000000005,
        "reward_min": -0.35562499999999936,
        "leartime_s": 0.02421639100066386,
        "sampletime": 9.138542990025599,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 6560000,
        "reward_mean": 0.8246000000000007,
        "reward_max": 1.602500000000001,
        "reward_min": 0.04437500000000078,
        "leartime_s": 0.01882141799433157,
        "sampletime": 9.089010268013226,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 6580000,
        "reward_mean": 0.9365000000000007,
        "reward_max": 1.9068750000000003,
        "reward_min": 0.3056250000000006,
        "leartime_s": 0.04069984701345675,
        "sampletime": 8.719666921009775,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 6600000,
        "reward_mean": 1.0925750000000007,
        "reward_max": 1.8618750000000004,
        "reward_min": 0.2625000000000006,
        "leartime_s": 0.020228598004905507,
        "sampletime": 9.302264165977249,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 6620000,
        "reward_mean": 0.7388500000000006,
        "reward_max": 1.481875000000001,
        "reward_min": -0.19312499999999924,
        "leartime_s": 0.02056040000752546,
        "sampletime": 9.290638301987201,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 6640000,
        "reward_mean": 0.7038500000000006,
        "reward_max": 1.5143750000000007,
        "reward_min": -0.6443749999999998,
        "leartime_s": 0.03429917700123042,
        "sampletime": 8.808601249998901,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 6660000,
        "reward_mean": 0.9822500000000007,
        "reward_max": 1.7881250000000006,
        "reward_min": -0.3212500000000002,
        "leartime_s": 0.018251442001201212,
        "sampletime": 9.433870036009466,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 6680000,
        "reward_mean": 0.8210500000000006,
        "reward_max": 1.8300000000000007,
        "reward_min": -0.054374999999999715,
        "leartime_s": 0.043874505994608626,
        "sampletime": 8.759495223988779,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 6700000,
        "reward_mean": 0.5388750000000007,
        "reward_max": 1.3762500000000006,
        "reward_min": -0.39249999999999907,
        "leartime_s": 0.018082743015838787,
        "sampletime": 8.800470385001972,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 6720000,
        "reward_mean": 0.7441250000000007,
        "reward_max": 1.4112500000000006,
        "reward_min": -0.11749999999999977,
        "leartime_s": 0.024698372988495976,
        "sampletime": 8.775809086015215,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 6740000,
        "reward_mean": 0.6987750000000007,
        "reward_max": 1.5593750000000008,
        "reward_min": -0.14062499999999992,
        "leartime_s": 0.0325315980007872,
        "sampletime": 8.950313534005545,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 6760000,
        "reward_mean": 0.7032500000000007,
        "reward_max": 1.506875000000001,
        "reward_min": -0.175,
        "leartime_s": 0.04465068699209951,
        "sampletime": 8.818994291999843,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 6780000,
        "reward_mean": 0.5920500000000006,
        "reward_max": 1.6900000000000004,
        "reward_min": -1.19625,
        "leartime_s": 0.03718911999021657,
        "sampletime": 8.778602439007955,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 6800000,
        "reward_mean": 0.5762000000000005,
        "reward_max": 1.4887500000000007,
        "reward_min": -0.1712499999999994,
        "leartime_s": 0.022630046994891018,
        "sampletime": 9.135773782007163,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 6820000,
        "reward_mean": 0.5932750000000006,
        "reward_max": 1.2931250000000007,
        "reward_min": -0.23999999999999955,
        "leartime_s": 0.01999164800508879,
        "sampletime": 8.977975202025846,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 6840000,
        "reward_mean": 0.7489000000000007,
        "reward_max": 1.7031250000000007,
        "reward_min": -0.2568749999999998,
        "leartime_s": 0.020879363000858575,
        "sampletime": 9.778574990981724,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 6860000,
        "reward_mean": 1.0206750000000007,
        "reward_max": 1.9662500000000005,
        "reward_min": 0.05000000000000036,
        "leartime_s": 0.0396815630083438,
        "sampletime": 10.517355966992909,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 6880000,
        "reward_mean": 0.7232250000000006,
        "reward_max": 1.5818750000000006,
        "reward_min": 0.04875000000000064,
        "leartime_s": 0.02115458800108172,
        "sampletime": 10.563978808990214,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 6900000,
        "reward_mean": 0.6218000000000007,
        "reward_max": 1.6262500000000004,
        "reward_min": -0.2599999999999991,
        "leartime_s": 0.033935495011974126,
        "sampletime": 11.227717329020379,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 6920000,
        "reward_mean": 0.5754750000000007,
        "reward_max": 1.452500000000001,
        "reward_min": -0.3774999999999996,
        "leartime_s": 0.0439416530134622,
        "sampletime": 12.048866179015022,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 6940000,
        "reward_mean": 0.42715000000000064,
        "reward_max": 1.1912500000000006,
        "reward_min": -0.8749999999999998,
        "leartime_s": 0.029219041985925287,
        "sampletime": 12.777161530015292,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 6960000,
        "reward_mean": 0.6627250000000006,
        "reward_max": 1.8331250000000003,
        "reward_min": -0.2899999999999994,
        "leartime_s": 0.05134386301506311,
        "sampletime": 13.046464087994536,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 6980000,
        "reward_mean": 0.38742500000000063,
        "reward_max": 1.1600000000000006,
        "reward_min": -0.7356249999999992,
        "leartime_s": 0.022780379018513486,
        "sampletime": 12.147420033987146,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 7000000,
        "reward_mean": 0.4811250000000007,
        "reward_max": 1.5975000000000006,
        "reward_min": -0.6756249999999999,
        "leartime_s": 0.02662121198954992,
        "sampletime": 12.346367991995066,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 7020000,
        "reward_mean": 0.5182500000000005,
        "reward_max": 1.2487500000000005,
        "reward_min": -0.23187499999999966,
        "leartime_s": 0.01939529099036008,
        "sampletime": 12.362670578993857,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 7040000,
        "reward_mean": 0.7685750000000007,
        "reward_max": 1.791875000000001,
        "reward_min": -0.41499999999999926,
        "leartime_s": 0.048381129978224635,
        "sampletime": 12.621270450996235,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 7060000,
        "reward_mean": 0.5335750000000006,
        "reward_max": 1.2481250000000008,
        "reward_min": -0.2931249999999997,
        "leartime_s": 0.07690014300169423,
        "sampletime": 12.34150238102302,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 7080000,
        "reward_mean": 0.6781750000000006,
        "reward_max": 1.601875000000001,
        "reward_min": -0.09812499999999963,
        "leartime_s": 0.051665417006006464,
        "sampletime": 11.708944242011057,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 7100000,
        "reward_mean": 0.36337500000000056,
        "reward_max": 1.1112500000000007,
        "reward_min": -1.2693749999999993,
        "leartime_s": 0.06013473798520863,
        "sampletime": 12.32512379498803,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 7120000,
        "reward_mean": 0.46472500000000055,
        "reward_max": 1.5368750000000007,
        "reward_min": -0.6443749999999995,
        "leartime_s": 0.032888649991946295,
        "sampletime": 12.575375030981377,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 7140000,
        "reward_mean": 0.6153000000000005,
        "reward_max": 1.6481250000000003,
        "reward_min": -0.7287499999999995,
        "leartime_s": 0.05961674900026992,
        "sampletime": 12.193835894024232,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 7160000,
        "reward_mean": 0.4891250000000007,
        "reward_max": 1.5975000000000006,
        "reward_min": -0.9999999999999991,
        "leartime_s": 0.046992671996122226,
        "sampletime": 12.422188113996526,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 7180000,
        "reward_mean": 0.4987500000000007,
        "reward_max": 1.322500000000001,
        "reward_min": -0.6599999999999997,
        "leartime_s": 0.03438347901101224,
        "sampletime": 11.96508222198463,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 7200000,
        "reward_mean": 0.6179000000000007,
        "reward_max": 1.4600000000000009,
        "reward_min": -0.4574999999999997,
        "leartime_s": 0.10465508402558044,
        "sampletime": 12.137562129006255,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 7220000,
        "reward_mean": 0.08140000000000057,
        "reward_max": 1.5062500000000005,
        "reward_min": -1.8681249999999996,
        "leartime_s": 0.055055462988093495,
        "sampletime": 12.21168215299258,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 7240000,
        "reward_mean": 0.6831500000000007,
        "reward_max": 1.6512500000000008,
        "reward_min": -0.7631249999999992,
        "leartime_s": 0.041032653010915965,
        "sampletime": 12.461921095993603,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 7260000,
        "reward_mean": 0.40392500000000053,
        "reward_max": 1.3950000000000007,
        "reward_min": -0.9643749999999998,
        "leartime_s": 0.024179681990062818,
        "sampletime": 12.064751463010907,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 7280000,
        "reward_mean": 0.2714500000000005,
        "reward_max": 1.7056250000000004,
        "reward_min": -0.8074999999999994,
        "leartime_s": 0.05006543698254973,
        "sampletime": 12.725043658982031,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 7300000,
        "reward_mean": 0.23577500000000054,
        "reward_max": 1.3362500000000008,
        "reward_min": -1.3274999999999995,
        "leartime_s": 0.03252994400099851,
        "sampletime": 12.238617333001457,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 7320000,
        "reward_mean": 0.5140750000000006,
        "reward_max": 1.371875000000001,
        "reward_min": -0.2362499999999996,
        "leartime_s": 0.06556509400252253,
        "sampletime": 12.105899440997746,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 7340000,
        "reward_mean": 0.6149750000000006,
        "reward_max": 1.6812500000000006,
        "reward_min": -0.6024999999999993,
        "leartime_s": 0.02619172100094147,
        "sampletime": 12.425531273998786,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 7360000,
        "reward_mean": 0.3893250000000006,
        "reward_max": 1.3906250000000004,
        "reward_min": -1.1181250000000003,
        "leartime_s": 0.022362321004038677,
        "sampletime": 12.697385640989523,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 7380000,
        "reward_mean": 0.3494000000000006,
        "reward_max": 1.4800000000000006,
        "reward_min": -1.6649999999999998,
        "leartime_s": 0.060128260985948145,
        "sampletime": 12.281615476997104,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 7400000,
        "reward_mean": -0.14534999999999945,
        "reward_max": 1.2031250000000004,
        "reward_min": -2.4312499999999995,
        "leartime_s": 0.06998827599454671,
        "sampletime": 12.164238343015313,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 7420000,
        "reward_mean": 0.43035000000000057,
        "reward_max": 1.4081250000000005,
        "reward_min": -0.3618749999999995,
        "leartime_s": 0.0403376079921145,
        "sampletime": 12.749162459978834,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 7440000,
        "reward_mean": 0.7725750000000005,
        "reward_max": 1.8331250000000006,
        "reward_min": -0.006874999999999382,
        "leartime_s": 0.050444085005437955,
        "sampletime": 12.314093517983565,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 7460000,
        "reward_mean": 0.3378750000000006,
        "reward_max": 1.2550000000000006,
        "reward_min": -1.0637499999999998,
        "leartime_s": 0.0437811259762384,
        "sampletime": 12.41752186298254,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 7480000,
        "reward_mean": 0.35092500000000065,
        "reward_max": 1.2725000000000006,
        "reward_min": -1.396874999999999,
        "leartime_s": 0.04448486299952492,
        "sampletime": 12.782334406976588,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 7500000,
        "reward_mean": 0.2592750000000006,
        "reward_max": 1.3425000000000007,
        "reward_min": -0.7862500000000002,
        "leartime_s": 0.03413431000080891,
        "sampletime": 12.863369403989054,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 7520000,
        "reward_mean": 0.1946750000000004,
        "reward_max": 1.5837500000000002,
        "reward_min": -1.3818749999999995,
        "leartime_s": 0.048287281999364495,
        "sampletime": 11.945192940009292,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 7540000,
        "reward_mean": 0.25827500000000053,
        "reward_max": 1.1975000000000007,
        "reward_min": -1.313125,
        "leartime_s": 0.02354976098285988,
        "sampletime": 12.427326901990455,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 7560000,
        "reward_mean": 0.33012500000000067,
        "reward_max": 1.2537500000000006,
        "reward_min": -0.9712499999999986,
        "leartime_s": 0.04050163697684184,
        "sampletime": 11.624761704995763,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 7580000,
        "reward_mean": 0.42887500000000056,
        "reward_max": 1.4231250000000004,
        "reward_min": -0.9156249999999995,
        "leartime_s": 0.018987448973348364,
        "sampletime": 11.095273419021396,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 7600000,
        "reward_mean": 0.3337000000000006,
        "reward_max": 1.3243750000000007,
        "reward_min": -1.0693749999999989,
        "leartime_s": 0.025757643015822396,
        "sampletime": 10.660596105008153,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 7620000,
        "reward_mean": -0.04339999999999957,
        "reward_max": 0.9343750000000001,
        "reward_min": -0.9612499999999999,
        "leartime_s": 0.034600837010657415,
        "sampletime": 10.363389060017653,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 7640000,
        "reward_mean": 0.30937500000000057,
        "reward_max": 1.3881250000000005,
        "reward_min": -1.2474999999999994,
        "leartime_s": 0.019254403974628076,
        "sampletime": 10.642484759999206,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 7660000,
        "reward_mean": 0.30997500000000056,
        "reward_max": 1.3850000000000002,
        "reward_min": -1.2174999999999998,
        "leartime_s": 0.019144803984090686,
        "sampletime": 8.605828333995305,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 7680000,
        "reward_mean": 0.3442500000000005,
        "reward_max": 1.2368750000000004,
        "reward_min": -0.7437499999999992,
        "leartime_s": 0.025094853015616536,
        "sampletime": 9.102666748978663,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 7700000,
        "reward_mean": 0.8132500000000005,
        "reward_max": 1.8725000000000005,
        "reward_min": -0.06249999999999983,
        "leartime_s": 0.02456875197822228,
        "sampletime": 8.969567570980871,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 7720000,
        "reward_mean": 0.7036750000000005,
        "reward_max": 1.6518750000000004,
        "reward_min": -0.7706249999999996,
        "leartime_s": 0.02065102302003652,
        "sampletime": 9.223450784978922,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 7740000,
        "reward_mean": 0.5886500000000006,
        "reward_max": 1.5675000000000003,
        "reward_min": -0.39687499999999964,
        "leartime_s": 0.020594146015355363,
        "sampletime": 9.163785737007856,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 7760000,
        "reward_mean": 0.5159250000000005,
        "reward_max": 1.3462500000000008,
        "reward_min": -0.3193749999999996,
        "leartime_s": 0.019017693994101137,
        "sampletime": 8.96585475601023,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 7780000,
        "reward_mean": 0.6371500000000007,
        "reward_max": 1.633750000000001,
        "reward_min": -1.0981249999999994,
        "leartime_s": 0.03397063602460548,
        "sampletime": 8.923805430007633,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 7800000,
        "reward_mean": 0.8283500000000006,
        "reward_max": 1.7475000000000005,
        "reward_min": -0.3774999999999996,
        "leartime_s": 0.02269648600486107,
        "sampletime": 8.931219688995043,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 7820000,
        "reward_mean": 0.6410500000000007,
        "reward_max": 1.7037500000000012,
        "reward_min": -0.21187499999999956,
        "leartime_s": 0.021809174009831622,
        "sampletime": 9.112943448999431,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 7840000,
        "reward_mean": 0.5616250000000006,
        "reward_max": 1.474375,
        "reward_min": -0.35624999999999957,
        "leartime_s": 0.018627894984092563,
        "sampletime": 9.043266915017739,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 7860000,
        "reward_mean": 0.5452250000000006,
        "reward_max": 1.4387500000000002,
        "reward_min": -0.6912499999999996,
        "leartime_s": 0.021746318001532927,
        "sampletime": 9.165909909002949,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 7880000,
        "reward_mean": 0.7150500000000006,
        "reward_max": 1.5675000000000006,
        "reward_min": 0.06750000000000048,
        "leartime_s": 0.06163738601026125,
        "sampletime": 9.268738605984254,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 7900000,
        "reward_mean": 0.7208500000000005,
        "reward_max": 1.7043750000000009,
        "reward_min": -0.01812499999999949,
        "leartime_s": 0.023948736023157835,
        "sampletime": 8.990675120992819,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 7920000,
        "reward_mean": 0.5882750000000007,
        "reward_max": 1.4531250000000004,
        "reward_min": -0.3862499999999992,
        "leartime_s": 0.02162415799102746,
        "sampletime": 9.146517382992897,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 7940000,
        "reward_mean": 0.7846500000000006,
        "reward_max": 1.704375000000001,
        "reward_min": -0.09499999999999956,
        "leartime_s": 0.028900576988235116,
        "sampletime": 9.05399349500658,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 7960000,
        "reward_mean": 0.5907750000000005,
        "reward_max": 1.5300000000000007,
        "reward_min": -0.655,
        "leartime_s": 0.031882196984952316,
        "sampletime": 8.780229285010137,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 7980000,
        "reward_mean": 0.5762250000000005,
        "reward_max": 1.4281250000000012,
        "reward_min": -0.3568749999999996,
        "leartime_s": 0.019256517000030726,
        "sampletime": 10.052484740008367,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 8000000,
        "reward_mean": 1.0222250000000008,
        "reward_max": 2.2231250000000014,
        "reward_min": 0.20437500000000036,
        "leartime_s": 0.020746594003867358,
        "sampletime": 11.188853409985313,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 8020000,
        "reward_mean": 0.49567500000000064,
        "reward_max": 1.263125000000001,
        "reward_min": -0.6456249999999986,
        "leartime_s": 0.045753674989100546,
        "sampletime": 12.679677945998264,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 8040000,
        "reward_mean": 0.8149000000000006,
        "reward_max": 1.7431250000000005,
        "reward_min": 0.003125000000000669,
        "leartime_s": 0.06118409501505084,
        "sampletime": 12.04909616598161,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 8060000,
        "reward_mean": 0.7525500000000007,
        "reward_max": 1.6187500000000008,
        "reward_min": -0.07562499999999928,
        "leartime_s": 0.0640887200133875,
        "sampletime": 11.849142791994382,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 8080000,
        "reward_mean": 0.8872500000000005,
        "reward_max": 1.7975000000000008,
        "reward_min": -0.1606249999999994,
        "leartime_s": 0.06414337499882095,
        "sampletime": 12.32313165999949,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 8100000,
        "reward_mean": 0.5281000000000005,
        "reward_max": 1.9287500000000004,
        "reward_min": -0.8349999999999996,
        "leartime_s": 0.022339689021464437,
        "sampletime": 12.34826402500039,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 8120000,
        "reward_mean": 0.9110000000000008,
        "reward_max": 1.6956250000000013,
        "reward_min": 0.11687500000000059,
        "leartime_s": 0.030666771985124797,
        "sampletime": 12.406572767009493,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 8140000,
        "reward_mean": 0.9159000000000007,
        "reward_max": 2.0493750000000004,
        "reward_min": 0.09812500000000066,
        "leartime_s": 0.04409439899609424,
        "sampletime": 12.501444905006792,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 8160000,
        "reward_mean": 0.4873250000000006,
        "reward_max": 1.6437500000000007,
        "reward_min": -1.1512499999999992,
        "leartime_s": 0.027801293996162713,
        "sampletime": 12.031895151973004,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 8180000,
        "reward_mean": 0.4302500000000006,
        "reward_max": 1.8756250000000003,
        "reward_min": -1.2618750000000007,
        "leartime_s": 0.047155527980066836,
        "sampletime": 12.48582000398892,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 8200000,
        "reward_mean": 0.6187500000000007,
        "reward_max": 1.6387500000000004,
        "reward_min": -1.1862499999999996,
        "leartime_s": 0.05112473401823081,
        "sampletime": 12.156729962996906,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 8220000,
        "reward_mean": 0.5902000000000005,
        "reward_max": 1.63625,
        "reward_min": -0.7524999999999995,
        "leartime_s": 0.04823558000498451,
        "sampletime": 12.05298030198901,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 8240000,
        "reward_mean": 0.8228250000000007,
        "reward_max": 1.7662500000000008,
        "reward_min": -0.029374999999999776,
        "leartime_s": 0.06513154599815607,
        "sampletime": 12.101872680999804,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 8260000,
        "reward_mean": 0.6839750000000006,
        "reward_max": 1.5750000000000006,
        "reward_min": -0.24374999999999913,
        "leartime_s": 0.025782414013519883,
        "sampletime": 12.176830965006957,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 8280000,
        "reward_mean": 0.6213000000000006,
        "reward_max": 1.5268750000000002,
        "reward_min": -0.8424999999999997,
        "leartime_s": 0.025611574994400144,
        "sampletime": 11.697589526011143,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 8300000,
        "reward_mean": 0.8396750000000007,
        "reward_max": 2.1006250000000004,
        "reward_min": -0.10124999999999924,
        "leartime_s": 0.060048013023333624,
        "sampletime": 12.39881748901098,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 8320000,
        "reward_mean": 0.4793000000000007,
        "reward_max": 1.4606250000000007,
        "reward_min": -0.7031249999999993,
        "leartime_s": 0.07477379398187622,
        "sampletime": 12.376596945978235,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 8340000,
        "reward_mean": 0.5180250000000007,
        "reward_max": 1.521250000000001,
        "reward_min": -0.4587499999999998,
        "leartime_s": 0.03151723399059847,
        "sampletime": 12.163169557985384,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 8360000,
        "reward_mean": 0.7935750000000006,
        "reward_max": 1.7187500000000002,
        "reward_min": -0.0793749999999995,
        "leartime_s": 0.0288039050064981,
        "sampletime": 12.62092352801119,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 8380000,
        "reward_mean": 1.0001000000000007,
        "reward_max": 2.0143750000000007,
        "reward_min": 0.08062500000000049,
        "leartime_s": 0.05537333499523811,
        "sampletime": 12.126111153018428,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 8400000,
        "reward_mean": 0.6290750000000008,
        "reward_max": 1.5162500000000008,
        "reward_min": -1.0062499999999996,
        "leartime_s": 0.039425469993148,
        "sampletime": 12.562599408003734,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 8420000,
        "reward_mean": 1.1076750000000006,
        "reward_max": 1.8881250000000007,
        "reward_min": 0.20875000000000088,
        "leartime_s": 0.0706983609998133,
        "sampletime": 12.636832166987006,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 8440000,
        "reward_mean": 0.7214250000000006,
        "reward_max": 1.7187500000000009,
        "reward_min": -0.7287499999999993,
        "leartime_s": 0.06061919700005092,
        "sampletime": 11.81533897999907,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 8460000,
        "reward_mean": 0.8708500000000008,
        "reward_max": 1.6600000000000008,
        "reward_min": -0.0024999999999990724,
        "leartime_s": 0.019778476998908445,
        "sampletime": 12.492249271977926,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 8480000,
        "reward_mean": 0.5856500000000008,
        "reward_max": 1.5206250000000006,
        "reward_min": -0.6162499999999991,
        "leartime_s": 0.020981502981157973,
        "sampletime": 11.785572727996623,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 8500000,
        "reward_mean": 0.5200500000000007,
        "reward_max": 1.6106250000000006,
        "reward_min": -1.14125,
        "leartime_s": 0.09139146099914797,
        "sampletime": 12.516370729979826,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 8520000,
        "reward_mean": 0.7911500000000008,
        "reward_max": 1.6106250000000009,
        "reward_min": -0.012499999999999331,
        "leartime_s": 0.022906883008545265,
        "sampletime": 12.602347934996942,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 8540000,
        "reward_mean": 0.8084750000000008,
        "reward_max": 1.883750000000001,
        "reward_min": -0.47562499999999946,
        "leartime_s": 0.041755154001293704,
        "sampletime": 12.269906481000362,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 8560000,
        "reward_mean": 0.9561250000000007,
        "reward_max": 1.7731250000000005,
        "reward_min": -0.01812499999999933,
        "leartime_s": 0.030990658997325227,
        "sampletime": 12.631382074992871,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 8580000,
        "reward_mean": 0.7069000000000007,
        "reward_max": 1.5250000000000008,
        "reward_min": -0.20124999999999965,
        "leartime_s": 0.058422580012120306,
        "sampletime": 12.472039964981377,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 8600000,
        "reward_mean": 0.8413500000000008,
        "reward_max": 1.648750000000001,
        "reward_min": -0.2406249999999989,
        "leartime_s": 0.029692853015149012,
        "sampletime": 11.984030230989447,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 8620000,
        "reward_mean": 0.9096250000000007,
        "reward_max": 1.6431250000000008,
        "reward_min": -0.05312499999999916,
        "leartime_s": 0.036259089974919334,
        "sampletime": 12.272888946987223,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 8640000,
        "reward_mean": 0.7951000000000006,
        "reward_max": 1.632500000000001,
        "reward_min": -0.42437499999999884,
        "leartime_s": 0.09171850798884407,
        "sampletime": 12.33243848301936,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 8660000,
        "reward_mean": 0.5693500000000006,
        "reward_max": 1.389375000000001,
        "reward_min": -0.37499999999999944,
        "leartime_s": 0.02298196399351582,
        "sampletime": 12.062364012992475,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 8680000,
        "reward_mean": 0.8268250000000007,
        "reward_max": 1.7150000000000003,
        "reward_min": -0.18812499999999976,
        "leartime_s": 0.04856895198463462,
        "sampletime": 12.296493753994582,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 8700000,
        "reward_mean": 0.5361250000000009,
        "reward_max": 1.4656250000000008,
        "reward_min": -1.0243749999999987,
        "leartime_s": 0.06786154498695396,
        "sampletime": 12.259404111013282,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 8720000,
        "reward_mean": 1.146125000000001,
        "reward_max": 2.3268750000000007,
        "reward_min": 0.4268750000000005,
        "leartime_s": 0.065773887996329,
        "sampletime": 12.001415617996827,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 8740000,
        "reward_mean": 0.9381000000000008,
        "reward_max": 1.7343750000000007,
        "reward_min": 0.057500000000000745,
        "leartime_s": 0.02653675401234068,
        "sampletime": 9.440384051005822,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 8760000,
        "reward_mean": 0.7954250000000007,
        "reward_max": 1.8031250000000008,
        "reward_min": -0.2924999999999994,
        "leartime_s": 0.02176226698793471,
        "sampletime": 8.88331249798648,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 8780000,
        "reward_mean": 0.7208500000000005,
        "reward_max": 1.662500000000001,
        "reward_min": -0.3887499999999991,
        "leartime_s": 0.021520549984415993,
        "sampletime": 8.970986016007373,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 8800000,
        "reward_mean": 0.7827250000000008,
        "reward_max": 1.9512500000000002,
        "reward_min": -0.6212499999999994,
        "leartime_s": 0.049159620015416294,
        "sampletime": 9.11487762699835,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 8820000,
        "reward_mean": 1.0615750000000008,
        "reward_max": 1.9650000000000005,
        "reward_min": 0.2906250000000008,
        "leartime_s": 0.022109583020210266,
        "sampletime": 9.258505695994245,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 8840000,
        "reward_mean": 0.8851000000000008,
        "reward_max": 1.8537500000000007,
        "reward_min": -0.16562499999999902,
        "leartime_s": 0.03667235400644131,
        "sampletime": 8.886421544011682,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 8860000,
        "reward_mean": 0.8367750000000008,
        "reward_max": 1.6756250000000013,
        "reward_min": 0.051875000000000726,
        "leartime_s": 0.025757494004210457,
        "sampletime": 9.088737195997965,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 8880000,
        "reward_mean": 0.9946500000000008,
        "reward_max": 1.911875000000001,
        "reward_min": 0.23875000000000066,
        "leartime_s": 0.04492897499585524,
        "sampletime": 9.319591626001056,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 8900000,
        "reward_mean": 1.0865500000000006,
        "reward_max": 1.9600000000000006,
        "reward_min": 0.2937500000000005,
        "leartime_s": 0.038022472988814116,
        "sampletime": 8.953776089998428,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 8920000,
        "reward_mean": 0.7430500000000009,
        "reward_max": 2.111250000000001,
        "reward_min": -0.6068749999999993,
        "leartime_s": 0.049097998009528965,
        "sampletime": 11.015648564993171,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 8940000,
        "reward_mean": 1.1513500000000008,
        "reward_max": 2.536250000000001,
        "reward_min": 0.24625000000000058,
        "leartime_s": 0.03701066100620665,
        "sampletime": 11.892306669993559,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 8960000,
        "reward_mean": 0.6016500000000008,
        "reward_max": 1.6831250000000009,
        "reward_min": -0.24499999999999889,
        "leartime_s": 0.06030013598501682,
        "sampletime": 12.661107691994403,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 8980000,
        "reward_mean": 0.9823500000000008,
        "reward_max": 1.9262500000000005,
        "reward_min": 0.025000000000000466,
        "leartime_s": 0.02353810498607345,
        "sampletime": 12.505549633002374,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 9000000,
        "reward_mean": 0.6536750000000008,
        "reward_max": 1.4187500000000008,
        "reward_min": -0.16624999999999895,
        "leartime_s": 0.05746262997854501,
        "sampletime": 11.746553072996903,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 9020000,
        "reward_mean": 1.0182500000000008,
        "reward_max": 2.1837500000000007,
        "reward_min": -0.4512499999999996,
        "leartime_s": 0.0533242890087422,
        "sampletime": 10.458275151991984,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 9040000,
        "reward_mean": 0.9616750000000007,
        "reward_max": 1.8931250000000008,
        "reward_min": -0.013749999999999277,
        "leartime_s": 0.03190350500517525,
        "sampletime": 10.415328489994863,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 9060000,
        "reward_mean": 0.6259750000000006,
        "reward_max": 1.4987500000000005,
        "reward_min": -1.0387499999999994,
        "leartime_s": 0.0322395559924189,
        "sampletime": 10.435553894989425,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 9080000,
        "reward_mean": 0.9676750000000008,
        "reward_max": 1.8675000000000008,
        "reward_min": 0.08937500000000038,
        "leartime_s": 0.054494209005497396,
        "sampletime": 10.592553371010581,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 9100000,
        "reward_mean": 0.6537250000000008,
        "reward_max": 1.5743750000000007,
        "reward_min": -0.8437499999999991,
        "leartime_s": 0.022276949981460348,
        "sampletime": 10.385543798998697,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 9120000,
        "reward_mean": 0.7580250000000007,
        "reward_max": 1.727500000000001,
        "reward_min": -0.42812499999999937,
        "leartime_s": 0.08214748301543295,
        "sampletime": 10.600366612023208,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 9140000,
        "reward_mean": 0.5270750000000008,
        "reward_max": 1.3887500000000008,
        "reward_min": -1.6524999999999985,
        "leartime_s": 0.03534121799748391,
        "sampletime": 10.781840640993323,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 9160000,
        "reward_mean": 0.6676750000000007,
        "reward_max": 1.631250000000001,
        "reward_min": -0.20624999999999935,
        "leartime_s": 0.07139320200076327,
        "sampletime": 10.660548768995795,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 9180000,
        "reward_mean": 0.6923750000000006,
        "reward_max": 1.8093750000000006,
        "reward_min": -0.5237499999999996,
        "leartime_s": 0.02296310497331433,
        "sampletime": 10.380855091003468,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 9200000,
        "reward_mean": 0.7980500000000006,
        "reward_max": 1.9425000000000006,
        "reward_min": -0.45999999999999963,
        "leartime_s": 0.05485090598813258,
        "sampletime": 10.354309162998106,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 9220000,
        "reward_mean": 0.8237500000000006,
        "reward_max": 1.6912500000000006,
        "reward_min": -0.5612499999999998,
        "leartime_s": 0.04641228500986472,
        "sampletime": 10.41071836501942,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 9240000,
        "reward_mean": 0.8157250000000006,
        "reward_max": 1.7093750000000005,
        "reward_min": -0.03437499999999975,
        "leartime_s": 0.05194398300955072,
        "sampletime": 10.278580652025994,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 9260000,
        "reward_mean": 0.6853750000000007,
        "reward_max": 1.9550000000000005,
        "reward_min": -1.9093749999999994,
        "leartime_s": 0.02875215301173739,
        "sampletime": 10.272154939972097,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 9280000,
        "reward_mean": 0.8502500000000007,
        "reward_max": 1.7293750000000012,
        "reward_min": -0.3512499999999992,
        "leartime_s": 0.05554445501184091,
        "sampletime": 10.238088123995112,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 9300000,
        "reward_mean": 0.9108250000000008,
        "reward_max": 1.9043750000000008,
        "reward_min": -0.6062499999999995,
        "leartime_s": 0.04367910698056221,
        "sampletime": 9.980804908991558,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 9320000,
        "reward_mean": 0.6830000000000009,
        "reward_max": 2.080625000000001,
        "reward_min": -0.4949999999999991,
        "leartime_s": 0.024511898984201252,
        "sampletime": 10.182457320013782,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 9340000,
        "reward_mean": 0.5688500000000007,
        "reward_max": 1.9500000000000004,
        "reward_min": -2.089999999999999,
        "leartime_s": 0.03056954700150527,
        "sampletime": 10.411079673009226,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 9360000,
        "reward_mean": 0.7167250000000008,
        "reward_max": 1.6331250000000006,
        "reward_min": -0.3037499999999995,
        "leartime_s": 0.02314098400529474,
        "sampletime": 10.49290429399116,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 9380000,
        "reward_mean": 0.9200250000000008,
        "reward_max": 2.1881250000000003,
        "reward_min": -0.8362499999999994,
        "leartime_s": 0.05887461299425922,
        "sampletime": 10.166689900011988,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 9400000,
        "reward_mean": 0.9908000000000008,
        "reward_max": 2.0012500000000006,
        "reward_min": 0.10625000000000084,
        "leartime_s": 0.05083886400097981,
        "sampletime": 10.446736649988452,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 9420000,
        "reward_mean": 0.7525000000000008,
        "reward_max": 1.7031250000000009,
        "reward_min": -0.35624999999999896,
        "leartime_s": 0.02601390000199899,
        "sampletime": 10.449559895001585,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 9440000,
        "reward_mean": 0.7864750000000006,
        "reward_max": 1.8431250000000001,
        "reward_min": -0.8374999999999992,
        "leartime_s": 0.022344869008520618,
        "sampletime": 10.640318780002417,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 9460000,
        "reward_mean": 0.7080500000000007,
        "reward_max": 1.5506250000000006,
        "reward_min": -1.2399999999999989,
        "leartime_s": 0.07747611499507912,
        "sampletime": 10.864940765983192,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 9480000,
        "reward_mean": 0.7940250000000008,
        "reward_max": 1.9387500000000004,
        "reward_min": -0.24062499999999976,
        "leartime_s": 0.05200527000124566,
        "sampletime": 10.537403725000331,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 9500000,
        "reward_mean": 0.7915750000000007,
        "reward_max": 1.6881250000000005,
        "reward_min": -1.1949999999999994,
        "leartime_s": 0.05395584300276823,
        "sampletime": 10.7679218010162,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 9520000,
        "reward_mean": 0.9429500000000007,
        "reward_max": 1.8075000000000006,
        "reward_min": -0.4687499999999994,
        "leartime_s": 0.03217789001064375,
        "sampletime": 10.715028289007023,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 9540000,
        "reward_mean": 0.9979250000000008,
        "reward_max": 2.116250000000001,
        "reward_min": 0.006250000000000772,
        "leartime_s": 0.04363737101084553,
        "sampletime": 10.47781648801174,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 9560000,
        "reward_mean": 1.2497750000000007,
        "reward_max": 2.0237500000000006,
        "reward_min": 0.031875000000000334,
        "leartime_s": 0.05115436701453291,
        "sampletime": 10.602570583025226,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 9580000,
        "reward_mean": 0.9687000000000008,
        "reward_max": 2.002500000000001,
        "reward_min": -0.15312499999999957,
        "leartime_s": 0.024373211985221133,
        "sampletime": 10.894734175002668,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 9600000,
        "reward_mean": 0.7489750000000007,
        "reward_max": 1.6881250000000012,
        "reward_min": -0.6693749999999997,
        "leartime_s": 0.022669001977192238,
        "sampletime": 10.339199753012508,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 9620000,
        "reward_mean": 0.9458500000000006,
        "reward_max": 2.3637500000000005,
        "reward_min": -0.5468749999999992,
        "leartime_s": 0.038366221007891,
        "sampletime": 10.013045905012405,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 9640000,
        "reward_mean": 0.8428750000000009,
        "reward_max": 1.932500000000001,
        "reward_min": -0.2837499999999993,
        "leartime_s": 0.024573033006163314,
        "sampletime": 10.56903839498409,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 9660000,
        "reward_mean": 0.45675000000000066,
        "reward_max": 1.6487500000000006,
        "reward_min": -0.9168749999999994,
        "leartime_s": 0.06141242600278929,
        "sampletime": 8.914930216007633,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 9680000,
        "reward_mean": 0.9256000000000009,
        "reward_max": 1.979375000000001,
        "reward_min": -0.07999999999999957,
        "leartime_s": 0.022732392011675984,
        "sampletime": 8.752162322984077,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 9700000,
        "reward_mean": 1.0809000000000006,
        "reward_max": 2.0143750000000002,
        "reward_min": -0.12187499999999946,
        "leartime_s": 0.025530771003104746,
        "sampletime": 9.661521425994579,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 9720000,
        "reward_mean": 0.7636750000000009,
        "reward_max": 1.9531250000000013,
        "reward_min": -0.9293749999999993,
        "leartime_s": 0.03487053100252524,
        "sampletime": 10.182306703994982,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 9740000,
        "reward_mean": 0.5277250000000008,
        "reward_max": 1.7131250000000011,
        "reward_min": -0.9687499999999996,
        "leartime_s": 0.040408095985185355,
        "sampletime": 9.385069683979964,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 9760000,
        "reward_mean": 0.7905750000000008,
        "reward_max": 1.6943750000000009,
        "reward_min": -0.22687499999999977,
        "leartime_s": 0.02799079701071605,
        "sampletime": 9.760989770002197,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 9780000,
        "reward_mean": 1.0885000000000007,
        "reward_max": 2.1693750000000005,
        "reward_min": -0.1012499999999998,
        "leartime_s": 0.0803384410100989,
        "sampletime": 10.2267869579955,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 9800000,
        "reward_mean": 0.7077500000000007,
        "reward_max": 1.916250000000001,
        "reward_min": -1.1174999999999995,
        "leartime_s": 0.023935210978379473,
        "sampletime": 9.2697585169808,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 9820000,
        "reward_mean": 0.9194750000000006,
        "reward_max": 2.321250000000001,
        "reward_min": -0.39124999999999915,
        "leartime_s": 0.03218679499696009,
        "sampletime": 9.541803625994362,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 9840000,
        "reward_mean": 0.6793500000000008,
        "reward_max": 1.7700000000000011,
        "reward_min": -0.36437499999999956,
        "leartime_s": 0.06014985099318437,
        "sampletime": 9.83867965999525,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 9860000,
        "reward_mean": 0.5128750000000006,
        "reward_max": 1.7112500000000006,
        "reward_min": -0.966875,
        "leartime_s": 0.03773823898518458,
        "sampletime": 9.540190485975472,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 9880000,
        "reward_mean": 0.7080750000000007,
        "reward_max": 1.773750000000001,
        "reward_min": -0.8912499999999995,
        "leartime_s": 0.023618341016117483,
        "sampletime": 9.270774060016265,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 9900000,
        "reward_mean": 0.6537000000000007,
        "reward_max": 1.545000000000001,
        "reward_min": -0.6375000000000008,
        "leartime_s": 0.033800728007918224,
        "sampletime": 9.746627015003469,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 9920000,
        "reward_mean": 0.7478750000000007,
        "reward_max": 2.0312500000000004,
        "reward_min": -0.9787499999999996,
        "leartime_s": 0.02793614999973215,
        "sampletime": 9.624195517011685,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 9940000,
        "reward_mean": 0.21405000000000068,
        "reward_max": 1.3775000000000006,
        "reward_min": -1.168749999999999,
        "leartime_s": 0.058843106002314016,
        "sampletime": 9.460042699996848,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 9960000,
        "reward_mean": 0.5555750000000007,
        "reward_max": 1.7525000000000008,
        "reward_min": -1.198124999999999,
        "leartime_s": 0.03784157501650043,
        "sampletime": 9.348034160997486,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 9980000,
        "reward_mean": 0.4147500000000006,
        "reward_max": 1.6343750000000008,
        "reward_min": -1.9724999999999997,
        "leartime_s": 0.023199479997856542,
        "sampletime": 9.938014229002874,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 10000000,
        "reward_mean": 0.48675000000000057,
        "reward_max": 2.126875000000001,
        "reward_min": -1.034374999999999,
        "leartime_s": 0.04102956398855895,
        "sampletime": 9.576972832990577,
        "best_mean": 1.5118750000000007,
        "best_max": 2.521875,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]