[
    {
        "generation": 1,
        "timesteps": 20000,
        "reward_mean": -39.57538592857143,
        "reward_max": -7.032500000000001,
        "reward_min": -79.61749999999999,
        "leartime_s": 0.018514883005991578,
        "sampletime": 9.704526375018759,
        "best_mean": -39.57538592857143,
        "best_max": -7.032500000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 40000,
        "reward_mean": -36.21929233333333,
        "reward_max": -0.35437499999999994,
        "reward_min": -110.16125000000001,
        "leartime_s": 0.013485230010701343,
        "sampletime": 9.847020080982475,
        "best_mean": -36.21929233333333,
        "best_max": -0.35437499999999994,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 60000,
        "reward_mean": -20.876475,
        "reward_max": 0.5693750000000014,
        "reward_min": -156.395,
        "leartime_s": 0.005435186991235241,
        "sampletime": 9.219693104008911,
        "best_mean": -20.876475,
        "best_max": 0.5693750000000014,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 80000,
        "reward_mean": -18.265700000000002,
        "reward_max": 1.2062500000000014,
        "reward_min": -53.75999999999999,
        "leartime_s": 0.007769529998768121,
        "sampletime": 9.982309197977884,
        "best_mean": -18.265700000000002,
        "best_max": 1.2062500000000014,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 100000,
        "reward_mean": -18.099225,
        "reward_max": 0.3931250000000012,
        "reward_min": -38.31125000000001,
        "leartime_s": 0.004841891000978649,
        "sampletime": 9.371916537988,
        "best_mean": -18.099225,
        "best_max": 0.3931250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 120000,
        "reward_mean": -19.499875,
        "reward_max": 0.9200000000000006,
        "reward_min": -75.046875,
        "leartime_s": 0.021185880003031343,
        "sampletime": 9.825014554022346,
        "best_mean": -18.099225,
        "best_max": 0.3931250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 140000,
        "reward_mean": -17.03835,
        "reward_max": -2.2612500000000004,
        "reward_min": -93.32062499999998,
        "leartime_s": 0.005100492999190465,
        "sampletime": 11.015069639019202,
        "best_mean": -17.03835,
        "best_max": -2.2612500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 160000,
        "reward_mean": -12.261650000000001,
        "reward_max": -4.667499999999999,
        "reward_min": -51.54750000000001,
        "leartime_s": 0.005868598003871739,
        "sampletime": 10.340021729003638,
        "best_mean": -12.261650000000001,
        "best_max": -4.667499999999999,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 180000,
        "reward_mean": -8.235599999999998,
        "reward_max": -1.743125,
        "reward_min": -21.536875,
        "leartime_s": 0.007169799006078392,
        "sampletime": 10.638060805009445,
        "best_mean": -8.235599999999998,
        "best_max": -1.743125,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 200000,
        "reward_mean": -4.759525,
        "reward_max": -1.4024999999999999,
        "reward_min": -17.93125,
        "leartime_s": 0.012927773001138121,
        "sampletime": 10.681375439016847,
        "best_mean": -4.759525,
        "best_max": -1.4024999999999999,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 220000,
        "reward_mean": -2.8069249999999992,
        "reward_max": -1.0099999999999998,
        "reward_min": -6.237499999999999,
        "leartime_s": 0.005093484011013061,
        "sampletime": 10.205390849994728,
        "best_mean": -2.8069249999999992,
        "best_max": -1.0099999999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 240000,
        "reward_mean": -2.0782249999999998,
        "reward_max": -0.71,
        "reward_min": -4.2,
        "leartime_s": 0.043498029990587384,
        "sampletime": 10.552022025978658,
        "best_mean": -2.0782249999999998,
        "best_max": -0.71,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 260000,
        "reward_mean": -1.9419749999999998,
        "reward_max": -0.6893750000000002,
        "reward_min": -3.9018749999999986,
        "leartime_s": 0.028024604980600998,
        "sampletime": 10.90522680999129,
        "best_mean": -1.9419749999999998,
        "best_max": -0.6893750000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 280000,
        "reward_mean": -1.66165,
        "reward_max": -0.82625,
        "reward_min": -2.8187499999999988,
        "leartime_s": 0.03105273499386385,
        "sampletime": 10.368893648992525,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 300000,
        "reward_mean": -1.780975,
        "reward_max": -0.6118750000000003,
        "reward_min": -4.0493749999999995,
        "leartime_s": 0.004974993003997952,
        "sampletime": 10.312038209987804,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 320000,
        "reward_mean": -2.1926499999999995,
        "reward_max": -0.9237500000000002,
        "reward_min": -4.439999999999997,
        "leartime_s": 0.005073503009043634,
        "sampletime": 11.038437597977463,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 340000,
        "reward_mean": -1.787575,
        "reward_max": -0.7725000000000002,
        "reward_min": -3.85875,
        "leartime_s": 0.03056194301461801,
        "sampletime": 10.168834145995788,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 360000,
        "reward_mean": -2.0705249999999995,
        "reward_max": -0.9056250000000005,
        "reward_min": -4.433749999999999,
        "leartime_s": 0.04034352698363364,
        "sampletime": 11.042800158000318,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 380000,
        "reward_mean": -1.8904499999999997,
        "reward_max": -0.6018750000000003,
        "reward_min": -4.651874999999999,
        "leartime_s": 0.00566854901262559,
        "sampletime": 10.513820509979269,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 400000,
        "reward_mean": -1.7933749999999995,
        "reward_max": -0.6200000000000002,
        "reward_min": -3.3956249999999972,
        "leartime_s": 0.005813610012410209,
        "sampletime": 10.396031807002146,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 420000,
        "reward_mean": -1.8194999999999997,
        "reward_max": -0.7725000000000003,
        "reward_min": -3.2181249999999997,
        "leartime_s": 0.014201062003849074,
        "sampletime": 11.352740425994853,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 440000,
        "reward_mean": -1.8636,
        "reward_max": -0.9650000000000003,
        "reward_min": -3.2124999999999995,
        "leartime_s": 0.005596927017904818,
        "sampletime": 10.400845447991742,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 460000,
        "reward_mean": -1.802275,
        "reward_max": -0.8881250000000004,
        "reward_min": -3.3100000000000005,
        "leartime_s": 0.005233546020463109,
        "sampletime": 10.840208009001799,
        "best_mean": -1.66165,
        "best_max": -0.82625,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 480000,
        "reward_mean": -1.572825,
        "reward_max": -0.6393750000000001,
        "reward_min": -3.7231249999999996,
        "leartime_s": 0.006064570014132187,
        "sampletime": 10.410248808009783,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 500000,
        "reward_mean": -1.7119499999999996,
        "reward_max": -0.8587500000000002,
        "reward_min": -3.193749999999997,
        "leartime_s": 0.01782351898145862,
        "sampletime": 10.643619385024067,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 520000,
        "reward_mean": -1.604975,
        "reward_max": -0.8881250000000004,
        "reward_min": -3.1325000000000003,
        "leartime_s": 0.057385066989809275,
        "sampletime": 11.108961719000945,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 540000,
        "reward_mean": -1.820825,
        "reward_max": -0.5006250000000001,
        "reward_min": -3.6518750000000004,
        "leartime_s": 0.017036392993759364,
        "sampletime": 10.299279130005743,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 560000,
        "reward_mean": -1.8223249999999998,
        "reward_max": -0.7175000000000002,
        "reward_min": -3.9012499999999983,
        "leartime_s": 0.010620738001307473,
        "sampletime": 10.698385925003095,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 580000,
        "reward_mean": -1.8748499999999995,
        "reward_max": -0.2587499999999999,
        "reward_min": -3.728749999999998,
        "leartime_s": 0.005830437003169209,
        "sampletime": 10.934966379980324,
        "best_mean": -1.572825,
        "best_max": -0.6393750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 600000,
        "reward_mean": -1.4503,
        "reward_max": -0.5081250000000002,
        "reward_min": -3.154999999999999,
        "leartime_s": 0.006030347023624927,
        "sampletime": 10.336184912011959,
        "best_mean": -1.4503,
        "best_max": -0.5081250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 620000,
        "reward_mean": -1.728175,
        "reward_max": -0.33562499999999995,
        "reward_min": -3.5418749999999974,
        "leartime_s": 0.0061195470043458045,
        "sampletime": 10.522181977983564,
        "best_mean": -1.4503,
        "best_max": -0.5081250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 640000,
        "reward_mean": -1.497125,
        "reward_max": -0.46625,
        "reward_min": -3.9318749999999993,
        "leartime_s": 0.010064072004752234,
        "sampletime": 10.777852903003804,
        "best_mean": -1.4503,
        "best_max": -0.5081250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 660000,
        "reward_mean": -1.5745499999999997,
        "reward_max": -0.56875,
        "reward_min": -3.156874999999998,
        "leartime_s": 0.018983216024935246,
        "sampletime": 11.137974284996744,
        "best_mean": -1.4503,
        "best_max": -0.5081250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 680000,
        "reward_mean": -1.6809749999999999,
        "reward_max": -0.3987499999999999,
        "reward_min": -4.172499999999996,
        "leartime_s": 0.019493980973493308,
        "sampletime": 10.440128971007653,
        "best_mean": -1.4503,
        "best_max": -0.5081250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 700000,
        "reward_mean": -1.4335,
        "reward_max": -0.43562500000000004,
        "reward_min": -2.881874999999998,
        "leartime_s": 0.02616683198721148,
        "sampletime": 10.77613582299091,
        "best_mean": -1.4335,
        "best_max": -0.43562500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 720000,
        "reward_mean": -1.0623250000000002,
        "reward_max": -0.11812499999999977,
        "reward_min": -2.205,
        "leartime_s": 0.04182659101206809,
        "sampletime": 11.331230579002295,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 740000,
        "reward_mean": -1.4345583333333334,
        "reward_max": -0.48812500000000014,
        "reward_min": -3.259374999999999,
        "leartime_s": 0.00604562001535669,
        "sampletime": 10.55037449998781,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 760000,
        "reward_mean": -1.4789,
        "reward_max": -0.37937499999999996,
        "reward_min": -2.957499999999999,
        "leartime_s": 0.005875150003703311,
        "sampletime": 11.2980471040064,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 780000,
        "reward_mean": -1.4827500000000002,
        "reward_max": -0.44374999999999987,
        "reward_min": -2.63,
        "leartime_s": 0.006477273011114448,
        "sampletime": 10.491766541003017,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 800000,
        "reward_mean": -1.38915,
        "reward_max": -0.27687499999999976,
        "reward_min": -3.1374999999999997,
        "leartime_s": 0.05111278500407934,
        "sampletime": 10.166923811018933,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 820000,
        "reward_mean": -1.4614500000000001,
        "reward_max": -0.6337500000000004,
        "reward_min": -2.6868749999999992,
        "leartime_s": 0.029020940011832863,
        "sampletime": 11.435690512007568,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 840000,
        "reward_mean": -1.2405,
        "reward_max": -0.36437499999999995,
        "reward_min": -2.3924999999999996,
        "leartime_s": 0.016656177991535515,
        "sampletime": 11.046733385010157,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 860000,
        "reward_mean": -1.5527343333333332,
        "reward_max": -0.6062500000000002,
        "reward_min": -2.839374999999999,
        "leartime_s": 0.007192334975115955,
        "sampletime": 10.514709628012497,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 880000,
        "reward_mean": -1.170525,
        "reward_max": -0.47125000000000017,
        "reward_min": -2.488125,
        "leartime_s": 0.007118417997844517,
        "sampletime": 11.548093298013555,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 900000,
        "reward_mean": -1.2747249999999999,
        "reward_max": -0.41812500000000014,
        "reward_min": -2.1806249999999996,
        "leartime_s": 0.006553846993483603,
        "sampletime": 10.66354821799905,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 920000,
        "reward_mean": -1.4216000000000002,
        "reward_max": -0.35000000000000003,
        "reward_min": -2.7418749999999994,
        "leartime_s": 0.007282598002348095,
        "sampletime": 10.94718271199963,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 940000,
        "reward_mean": -1.330125,
        "reward_max": -0.5231249999999996,
        "reward_min": -2.93125,
        "leartime_s": 0.0064882680017035455,
        "sampletime": 10.985364393010968,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 960000,
        "reward_mean": -1.479,
        "reward_max": -0.37375,
        "reward_min": -2.857499999999999,
        "leartime_s": 0.016010224993806332,
        "sampletime": 10.41767714699381,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 980000,
        "reward_mean": -1.521525,
        "reward_max": -0.5356250000000001,
        "reward_min": -3.5187499999999994,
        "leartime_s": 0.020896460016956553,
        "sampletime": 11.355317627982004,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 1000000,
        "reward_mean": -1.536425,
        "reward_max": -0.4912499999999999,
        "reward_min": -4.191249999999999,
        "leartime_s": 0.011465504008810967,
        "sampletime": 11.08431020998978,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 1020000,
        "reward_mean": -1.6916999999999998,
        "reward_max": -0.7481250000000003,
        "reward_min": -3.646874999999998,
        "leartime_s": 0.00945285800844431,
        "sampletime": 10.580260215996532,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 1040000,
        "reward_mean": -1.3670499999999999,
        "reward_max": -0.5356250000000002,
        "reward_min": -3.6900000000000004,
        "leartime_s": 0.006570569996256381,
        "sampletime": 11.169236446992727,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 1060000,
        "reward_mean": -1.5095,
        "reward_max": -0.5887500000000002,
        "reward_min": -3.926249999999999,
        "leartime_s": 0.016659288987284526,
        "sampletime": 10.548190318018897,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 1080000,
        "reward_mean": -1.2678000000000003,
        "reward_max": -0.543125,
        "reward_min": -2.824999999999999,
        "leartime_s": 0.02813827700447291,
        "sampletime": 11.435067568003433,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 1100000,
        "reward_mean": -1.8227999999999998,
        "reward_max": -0.6206250000000001,
        "reward_min": -4.416249999999999,
        "leartime_s": 0.0074747930048033595,
        "sampletime": 10.362085214001127,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 1120000,
        "reward_mean": -1.614575,
        "reward_max": -0.4775000000000001,
        "reward_min": -3.8387499999999997,
        "leartime_s": 0.007213442993815988,
        "sampletime": 10.882996966014616,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 1140000,
        "reward_mean": -2.1681999999999997,
        "reward_max": -0.7387500000000001,
        "reward_min": -4.680624999999998,
        "leartime_s": 0.007728873984888196,
        "sampletime": 10.958716624998488,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 1160000,
        "reward_mean": -1.9563499999999998,
        "reward_max": -0.28062500000000007,
        "reward_min": -5.087499999999999,
        "leartime_s": 0.016184904001420364,
        "sampletime": 10.582117876998382,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 1180000,
        "reward_mean": -1.610125,
        "reward_max": -0.6237500000000005,
        "reward_min": -3.59,
        "leartime_s": 0.01031181399594061,
        "sampletime": 10.634656731999712,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 1200000,
        "reward_mean": -1.4580500000000003,
        "reward_max": -0.3006250000000001,
        "reward_min": -3.048125,
        "leartime_s": 0.007158006017562002,
        "sampletime": 10.987721789017087,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 1220000,
        "reward_mean": -1.4400000000000002,
        "reward_max": -0.5775000000000001,
        "reward_min": -3.0200000000000005,
        "leartime_s": 0.011882582010002807,
        "sampletime": 10.842922918993281,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 1240000,
        "reward_mean": -1.57165,
        "reward_max": -0.500625,
        "reward_min": -3.6556249999999997,
        "leartime_s": 0.03057277901098132,
        "sampletime": 11.175995942990994,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 1260000,
        "reward_mean": -1.2570908333333333,
        "reward_max": -0.2893749999999998,
        "reward_min": -2.6912499999999993,
        "leartime_s": 0.018565400008810684,
        "sampletime": 10.936561890994199,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 1280000,
        "reward_mean": -1.5223499999999999,
        "reward_max": -0.25687499999999985,
        "reward_min": -3.5012500000000006,
        "leartime_s": 0.035819632990751415,
        "sampletime": 10.497893784980988,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 1300000,
        "reward_mean": -1.7132749999999999,
        "reward_max": -0.5468749999999999,
        "reward_min": -3.7768749999999978,
        "leartime_s": 0.02189583401195705,
        "sampletime": 10.987681547005195,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 1320000,
        "reward_mean": -1.6394000000000002,
        "reward_max": -0.6725,
        "reward_min": -3.42125,
        "leartime_s": 0.017503586976090446,
        "sampletime": 10.368782517994987,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 1340000,
        "reward_mean": -1.476175,
        "reward_max": -0.21874999999999992,
        "reward_min": -3.2024999999999997,
        "leartime_s": 0.024249993002740666,
        "sampletime": 10.81406173898722,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 1360000,
        "reward_mean": -1.441875,
        "reward_max": -0.2856249999999997,
        "reward_min": -4.014374999999999,
        "leartime_s": 0.024920555006247014,
        "sampletime": 10.532932739006355,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 1380000,
        "reward_mean": -1.420625,
        "reward_max": -0.5743750000000002,
        "reward_min": -3.039374999999999,
        "leartime_s": 0.015666452003642917,
        "sampletime": 10.897112750011729,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 1400000,
        "reward_mean": -1.739,
        "reward_max": -0.5531250000000001,
        "reward_min": -3.754374999999998,
        "leartime_s": 0.03643031499814242,
        "sampletime": 10.487135128001682,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 1420000,
        "reward_mean": -1.4987499999999998,
        "reward_max": -0.37375,
        "reward_min": -3.8593749999999987,
        "leartime_s": 0.018004273006226867,
        "sampletime": 10.751622651005164,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 1440000,
        "reward_mean": -1.5395999999999999,
        "reward_max": -0.5675000000000001,
        "reward_min": -3.4049999999999985,
        "leartime_s": 0.025279665016569197,
        "sampletime": 10.333631768007763,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 1460000,
        "reward_mean": -1.35955,
        "reward_max": -0.39750000000000013,
        "reward_min": -3.539999999999999,
        "leartime_s": 0.016521655983524397,
        "sampletime": 10.85900151799433,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 1480000,
        "reward_mean": -1.49815,
        "reward_max": -0.6825000000000001,
        "reward_min": -3.277499999999999,
        "leartime_s": 0.01721242899657227,
        "sampletime": 10.727631576010026,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 1500000,
        "reward_mean": -1.6115249999999997,
        "reward_max": -0.33624999999999994,
        "reward_min": -3.9924999999999993,
        "leartime_s": 0.012694844015641138,
        "sampletime": 10.412938958004816,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 1520000,
        "reward_mean": -1.1862249999999999,
        "reward_max": -0.39562500000000006,
        "reward_min": -2.5281250000000006,
        "leartime_s": 0.025412857998162508,
        "sampletime": 10.507904756988864,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 1540000,
        "reward_mean": -1.5430749999999998,
        "reward_max": -0.3331250000000001,
        "reward_min": -3.571249999999999,
        "leartime_s": 0.007294041017303243,
        "sampletime": 10.815886547003174,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 1560000,
        "reward_mean": -1.272375,
        "reward_max": -0.49124999999999996,
        "reward_min": -2.6500000000000004,
        "leartime_s": 0.016117619001306593,
        "sampletime": 10.531385759008117,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 1580000,
        "reward_mean": -1.2388500000000002,
        "reward_max": -0.41937500000000016,
        "reward_min": -2.8275,
        "leartime_s": 0.009416140004759654,
        "sampletime": 11.065044665010646,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 1600000,
        "reward_mean": -1.2735500000000002,
        "reward_max": -0.409375,
        "reward_min": -2.728124999999999,
        "leartime_s": 0.0076179430179763585,
        "sampletime": 10.95280953400652,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 1620000,
        "reward_mean": -1.4957,
        "reward_max": -0.7162500000000002,
        "reward_min": -4.254374999999998,
        "leartime_s": 0.01662705501075834,
        "sampletime": 10.384423307987163,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 1640000,
        "reward_mean": -1.2720185000000002,
        "reward_max": -0.5281250000000003,
        "reward_min": -2.444375000000001,
        "leartime_s": 0.024908959021558985,
        "sampletime": 11.132241717976285,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 1660000,
        "reward_mean": -1.2859,
        "reward_max": -0.455625,
        "reward_min": -2.9675000000000002,
        "leartime_s": 0.024659109010826796,
        "sampletime": 10.556037630012725,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 1680000,
        "reward_mean": -1.070175,
        "reward_max": -0.325,
        "reward_min": -2.405625000000001,
        "leartime_s": 0.022757692000595853,
        "sampletime": 10.69571679798537,
        "best_mean": -1.0623250000000002,
        "best_max": -0.11812499999999977,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 1700000,
        "reward_mean": -1.0244750000000002,
        "reward_max": -0.26312500000000005,
        "reward_min": -2.2312499999999997,
        "leartime_s": 0.0111833089904394,
        "sampletime": 10.93906768297893,
        "best_mean": -1.0244750000000002,
        "best_max": -0.26312500000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 1720000,
        "reward_mean": -0.999775,
        "reward_max": -0.24937499999999987,
        "reward_min": -2.088749999999999,
        "leartime_s": 0.007946867001010105,
        "sampletime": 10.844550229987362,
        "best_mean": -0.999775,
        "best_max": -0.24937499999999987,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 1740000,
        "reward_mean": -0.9512,
        "reward_max": -0.3212499999999999,
        "reward_min": -2.034375,
        "leartime_s": 0.03366526300669648,
        "sampletime": 10.746049548994051,
        "best_mean": -0.9512,
        "best_max": -0.3212499999999999,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 1760000,
        "reward_mean": -0.7432000000000001,
        "reward_max": 0.10062500000000028,
        "reward_min": -1.3862500000000004,
        "leartime_s": 0.02481999300653115,
        "sampletime": 10.754735382011859,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 1780000,
        "reward_mean": -1.0493000000000001,
        "reward_max": -0.3650000000000001,
        "reward_min": -2.8975000000000004,
        "leartime_s": 0.00822781800525263,
        "sampletime": 10.583435617998475,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 1800000,
        "reward_mean": -1.2980144761904764,
        "reward_max": -0.5775000000000002,
        "reward_min": -2.1443750000000006,
        "leartime_s": 0.007969647995196283,
        "sampletime": 10.872728643997107,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 1820000,
        "reward_mean": -0.9073806190476191,
        "reward_max": -0.010624999999999843,
        "reward_min": -1.8700000000000003,
        "leartime_s": 0.008014096994884312,
        "sampletime": 10.475863881001715,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 1840000,
        "reward_mean": -0.9681000000000003,
        "reward_max": -0.2637499999999999,
        "reward_min": -1.7799999999999998,
        "leartime_s": 0.023355871002422646,
        "sampletime": 10.934654665004928,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 1860000,
        "reward_mean": -1.1137360000000003,
        "reward_max": -0.3193749999999999,
        "reward_min": -2.403333333333334,
        "leartime_s": 0.026516105979681015,
        "sampletime": 10.795941268006572,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 1880000,
        "reward_mean": -1.0083,
        "reward_max": -0.3537499999999998,
        "reward_min": -2.5812499999999994,
        "leartime_s": 0.008253389009041712,
        "sampletime": 10.855168326990679,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 1900000,
        "reward_mean": -1.1382750000000001,
        "reward_max": -0.2974999999999999,
        "reward_min": -2.296875,
        "leartime_s": 0.011774407990742475,
        "sampletime": 10.285287503007567,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 1920000,
        "reward_mean": -0.9471925000000002,
        "reward_max": -0.20562500000000009,
        "reward_min": -1.7468750000000004,
        "leartime_s": 0.008044841000810266,
        "sampletime": 11.161963499995181,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 1940000,
        "reward_mean": -1.199575,
        "reward_max": -0.39625,
        "reward_min": -2.20375,
        "leartime_s": 0.028838739992352203,
        "sampletime": 10.356628129986348,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 1960000,
        "reward_mean": -1.0736129285714289,
        "reward_max": -0.4281250000000002,
        "reward_min": -1.9531249999999996,
        "leartime_s": 0.010150808986509219,
        "sampletime": 10.65698595897993,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 1980000,
        "reward_mean": -1.0880500000000002,
        "reward_max": -0.29624999999999996,
        "reward_min": -2.06625,
        "leartime_s": 0.022330089006572962,
        "sampletime": 10.720891876990208,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 2000000,
        "reward_mean": -1.1921750000000002,
        "reward_max": -0.2812499999999999,
        "reward_min": -2.6312499999999988,
        "leartime_s": 0.03204335898044519,
        "sampletime": 10.318424212018726,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 2020000,
        "reward_mean": -1.2322000000000002,
        "reward_max": -0.4462500000000001,
        "reward_min": -2.5818749999999993,
        "leartime_s": 0.009495108999544755,
        "sampletime": 10.387787743995432,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 2040000,
        "reward_mean": -1.1018250000000003,
        "reward_max": -0.2249999999999998,
        "reward_min": -2.4324999999999997,
        "leartime_s": 0.027101467974716797,
        "sampletime": 11.045142873976147,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 2060000,
        "reward_mean": -1.1326000000000003,
        "reward_max": -0.3625,
        "reward_min": -2.0593750000000006,
        "leartime_s": 0.06563738800468855,
        "sampletime": 10.226930247998098,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 2080000,
        "reward_mean": -1.0984500000000001,
        "reward_max": -0.360625,
        "reward_min": -1.9675,
        "leartime_s": 0.018085532006807625,
        "sampletime": 11.497913041996071,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 2100000,
        "reward_mean": -1.0443915000000001,
        "reward_max": -0.28125,
        "reward_min": -1.8943750000000004,
        "leartime_s": 0.018305924022570252,
        "sampletime": 10.768915861990536,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 2120000,
        "reward_mean": -1.202625,
        "reward_max": -0.33749999999999997,
        "reward_min": -2.387499999999999,
        "leartime_s": 0.025473527988651767,
        "sampletime": 10.288169675011886,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 2140000,
        "reward_mean": -0.8569750000000002,
        "reward_max": -0.13187499999999977,
        "reward_min": -1.62,
        "leartime_s": 0.0088289350096602,
        "sampletime": 11.045461898000212,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 2160000,
        "reward_mean": -1.1948250000000002,
        "reward_max": -0.41000000000000003,
        "reward_min": -2.506249999999999,
        "leartime_s": 0.008715784992091358,
        "sampletime": 10.542095118988072,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 2180000,
        "reward_mean": -1.1303250000000002,
        "reward_max": -0.4375,
        "reward_min": -1.8912499999999999,
        "leartime_s": 0.03498299000784755,
        "sampletime": 10.538751368003432,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 2200000,
        "reward_mean": -1.081275,
        "reward_max": -0.2400000000000001,
        "reward_min": -2.7049999999999983,
        "leartime_s": 0.00900883600115776,
        "sampletime": 9.920396458008327,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 2220000,
        "reward_mean": -1.0867250000000004,
        "reward_max": -0.250625,
        "reward_min": -1.8093750000000006,
        "leartime_s": 0.009257140016416088,
        "sampletime": 11.097390176000772,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 2240000,
        "reward_mean": -0.857525,
        "reward_max": -0.05062499999999976,
        "reward_min": -1.7468750000000004,
        "leartime_s": 0.009856824995949864,
        "sampletime": 10.510666246002074,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 2260000,
        "reward_mean": -1.1650500000000001,
        "reward_max": -0.598125,
        "reward_min": -2.424375000000001,
        "leartime_s": 0.015930701018078253,
        "sampletime": 10.04117969199433,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 2280000,
        "reward_mean": -1.156425,
        "reward_max": -0.24749999999999994,
        "reward_min": -2.0449999999999995,
        "leartime_s": 0.028121668990934268,
        "sampletime": 10.753635264991317,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 2300000,
        "reward_mean": -1.2026,
        "reward_max": -0.4343750000000001,
        "reward_min": -2.3849999999999993,
        "leartime_s": 0.021157253009732813,
        "sampletime": 10.51412813499337,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 2320000,
        "reward_mean": -0.84745,
        "reward_max": -0.27062499999999995,
        "reward_min": -1.694375,
        "leartime_s": 0.028471961006289348,
        "sampletime": 10.535011226980714,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 2340000,
        "reward_mean": -1.1105000000000003,
        "reward_max": -0.30124999999999985,
        "reward_min": -2.0868749999999996,
        "leartime_s": 0.009758920001331717,
        "sampletime": 11.035004977020435,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 2360000,
        "reward_mean": -0.891575,
        "reward_max": -0.07749999999999985,
        "reward_min": -1.7412499999999995,
        "leartime_s": 0.06550394199439324,
        "sampletime": 10.702595936978469,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 2380000,
        "reward_mean": -1.1674181428571433,
        "reward_max": -0.41375000000000006,
        "reward_min": -2.1406250000000004,
        "leartime_s": 0.01602110601379536,
        "sampletime": 11.298132708994672,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 2400000,
        "reward_mean": -0.8790000000000002,
        "reward_max": -0.16312499999999988,
        "reward_min": -1.5331250000000005,
        "leartime_s": 0.039314940018812194,
        "sampletime": 10.69650601700414,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 2420000,
        "reward_mean": -1.090125,
        "reward_max": -0.05999999999999987,
        "reward_min": -2.173125,
        "leartime_s": 0.02058270000270568,
        "sampletime": 10.376429006020771,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 2440000,
        "reward_mean": -1.084,
        "reward_max": -0.4550000000000001,
        "reward_min": -1.7543749999999994,
        "leartime_s": 0.01928777399007231,
        "sampletime": 10.94059961399762,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 2460000,
        "reward_mean": -0.893575,
        "reward_max": -0.17062499999999992,
        "reward_min": -1.8250000000000002,
        "leartime_s": 0.02703985699918121,
        "sampletime": 10.737753926980076,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 2480000,
        "reward_mean": -0.8832250000000001,
        "reward_max": 0.0956250000000003,
        "reward_min": -1.7149999999999999,
        "leartime_s": 0.02001161000225693,
        "sampletime": 10.33830016097636,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 2500000,
        "reward_mean": -1.3870500000000001,
        "reward_max": -0.4431249999999999,
        "reward_min": -2.8431249999999997,
        "leartime_s": 0.010487375024240464,
        "sampletime": 10.874095200008014,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 2520000,
        "reward_mean": -0.90815,
        "reward_max": -0.18874999999999983,
        "reward_min": -1.786875,
        "leartime_s": 0.016880892013432458,
        "sampletime": 10.668220953986747,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 2540000,
        "reward_mean": -0.8684750000000001,
        "reward_max": 0.20500000000000035,
        "reward_min": -1.7287499999999998,
        "leartime_s": 0.009119201014982536,
        "sampletime": 11.12256944400724,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 2560000,
        "reward_mean": -1.0116250000000002,
        "reward_max": -0.30250000000000005,
        "reward_min": -1.6968750000000001,
        "leartime_s": 0.00940525101032108,
        "sampletime": 10.216882805980276,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 2580000,
        "reward_mean": -1.081025,
        "reward_max": -0.33999999999999997,
        "reward_min": -2.1718749999999996,
        "leartime_s": 0.06221892300527543,
        "sampletime": 10.306305498001166,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 2600000,
        "reward_mean": -1.1535000000000002,
        "reward_max": -0.5337500000000003,
        "reward_min": -1.994375,
        "leartime_s": 0.0207021749811247,
        "sampletime": 11.249621075985488,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 2620000,
        "reward_mean": -1.1403,
        "reward_max": -0.5275000000000003,
        "reward_min": -2.5362500000000003,
        "leartime_s": 0.015635656978702173,
        "sampletime": 10.526456311985385,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 2640000,
        "reward_mean": -1.1093499999999998,
        "reward_max": -0.4650000000000002,
        "reward_min": -1.8462500000000004,
        "leartime_s": 0.026051045017084107,
        "sampletime": 10.603337884997018,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 2660000,
        "reward_mean": -1.0995000000000001,
        "reward_max": -0.16937500000000005,
        "reward_min": -2.7362499999999996,
        "leartime_s": 0.009627303021261469,
        "sampletime": 10.5470297029824,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 2680000,
        "reward_mean": -1.0619230000000002,
        "reward_max": -0.3268749999999999,
        "reward_min": -2.7074999999999996,
        "leartime_s": 0.07398762801312841,
        "sampletime": 10.617322467995109,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 2700000,
        "reward_mean": -1.0598,
        "reward_max": -0.43125,
        "reward_min": -2.2262500000000007,
        "leartime_s": 0.009393502987222746,
        "sampletime": 11.358911388990236,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 2720000,
        "reward_mean": -1.298375,
        "reward_max": -0.5581250000000002,
        "reward_min": -2.8112499999999994,
        "leartime_s": 0.011520504020154476,
        "sampletime": 10.476827851001872,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 2740000,
        "reward_mean": -1.36305,
        "reward_max": -0.5906250000000001,
        "reward_min": -2.7981249999999998,
        "leartime_s": 0.05432025299523957,
        "sampletime": 10.536979877011618,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 2760000,
        "reward_mean": -1.0381750000000003,
        "reward_max": -0.33,
        "reward_min": -1.9206250000000007,
        "leartime_s": 0.04972825199365616,
        "sampletime": 11.315364790993044,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 2780000,
        "reward_mean": -1.0643000000000002,
        "reward_max": -0.14750000000000002,
        "reward_min": -2.150625,
        "leartime_s": 0.016399605985498056,
        "sampletime": 10.57757570699323,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 2800000,
        "reward_mean": -0.8274500000000001,
        "reward_max": -0.11437499999999992,
        "reward_min": -1.95,
        "leartime_s": 0.009927085979143158,
        "sampletime": 10.52404710900737,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 2820000,
        "reward_mean": -0.9007000000000001,
        "reward_max": 0.18687500000000007,
        "reward_min": -2.564374999999999,
        "leartime_s": 0.012421569001162425,
        "sampletime": 11.02958080699318,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 2840000,
        "reward_mean": -1.1276749999999998,
        "reward_max": -0.15562499999999993,
        "reward_min": -2.5887499999999997,
        "leartime_s": 0.01772079200600274,
        "sampletime": 10.391144587018061,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 2860000,
        "reward_mean": -1.2227618333333334,
        "reward_max": -0.46187500000000004,
        "reward_min": -3.0075000000000007,
        "leartime_s": 0.025747998006409034,
        "sampletime": 10.515153548010858,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 2880000,
        "reward_mean": -1.1100250000000003,
        "reward_max": -0.3268750000000001,
        "reward_min": -1.8831249999999997,
        "leartime_s": 0.0188953600008972,
        "sampletime": 10.639725507004187,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 2900000,
        "reward_mean": -1.173775,
        "reward_max": -0.2631249999999999,
        "reward_min": -2.3706250000000004,
        "leartime_s": 0.027632765006273985,
        "sampletime": 10.238973208994139,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 2920000,
        "reward_mean": -1.121625,
        "reward_max": -0.24874999999999992,
        "reward_min": -2.5218749999999988,
        "leartime_s": 0.012623260001419112,
        "sampletime": 11.012292271014303,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 2940000,
        "reward_mean": -1.0262,
        "reward_max": -0.09687499999999996,
        "reward_min": -2.7199999999999998,
        "leartime_s": 0.038210786995477974,
        "sampletime": 10.149486452020938,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 2960000,
        "reward_mean": -1.0772668333333335,
        "reward_max": -0.245,
        "reward_min": -2.480625,
        "leartime_s": 0.05568846999085508,
        "sampletime": 10.532426624995423,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 2980000,
        "reward_mean": -1.1993250000000002,
        "reward_max": -0.51625,
        "reward_min": -2.0131249999999996,
        "leartime_s": 0.021108851011376828,
        "sampletime": 10.977545589994406,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 3000000,
        "reward_mean": -1.0002750000000002,
        "reward_max": -0.2831250000000001,
        "reward_min": -2.3625000000000003,
        "leartime_s": 0.06293169999844395,
        "sampletime": 10.496557200996904,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 3020000,
        "reward_mean": -1.2385500000000003,
        "reward_max": -0.1693749999999999,
        "reward_min": -2.5987500000000003,
        "leartime_s": 0.029600589972687885,
        "sampletime": 10.211558801005594,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 3040000,
        "reward_mean": -0.8581750000000001,
        "reward_max": -0.17625000000000013,
        "reward_min": -2.0881250000000002,
        "leartime_s": 0.029084117006277665,
        "sampletime": 10.995441831997596,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 3060000,
        "reward_mean": -0.8675000000000002,
        "reward_max": -0.24312499999999998,
        "reward_min": -1.5574999999999999,
        "leartime_s": 0.04869284000596963,
        "sampletime": 10.451272102014627,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 3080000,
        "reward_mean": -0.961675,
        "reward_max": 0.025625000000000106,
        "reward_min": -2.425624999999999,
        "leartime_s": 0.012712835014099255,
        "sampletime": 10.793268370995065,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 3100000,
        "reward_mean": -0.9784750000000001,
        "reward_max": -0.35375,
        "reward_min": -1.8343750000000005,
        "leartime_s": 0.0105395219870843,
        "sampletime": 10.71836353398976,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 3120000,
        "reward_mean": -1.039975,
        "reward_max": -0.2737500000000002,
        "reward_min": -1.9224999999999999,
        "leartime_s": 0.025805889017647132,
        "sampletime": 10.450480856001377,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 3140000,
        "reward_mean": -0.9402750000000002,
        "reward_max": -0.2918750000000002,
        "reward_min": -2.0725000000000002,
        "leartime_s": 0.02120412199292332,
        "sampletime": 11.117846990004182,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 3160000,
        "reward_mean": -0.9992750000000002,
        "reward_max": -0.054375000000000145,
        "reward_min": -1.9312500000000001,
        "leartime_s": 0.03363967401674017,
        "sampletime": 10.389697456994327,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 3180000,
        "reward_mean": -0.9913000000000002,
        "reward_max": -0.28812499999999996,
        "reward_min": -1.98125,
        "leartime_s": 0.011987870006123558,
        "sampletime": 11.322392353991745,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 3200000,
        "reward_mean": -1.0269500000000003,
        "reward_max": -0.4118750000000002,
        "reward_min": -1.835625000000001,
        "leartime_s": 0.01360084000043571,
        "sampletime": 10.427220240992028,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 3220000,
        "reward_mean": -1.1694500000000003,
        "reward_max": -0.3743750000000001,
        "reward_min": -2.4006250000000002,
        "leartime_s": 0.010296938009560108,
        "sampletime": 10.517648867011303,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 3240000,
        "reward_mean": -1.104821285714286,
        "reward_max": -0.17437500000000003,
        "reward_min": -2.5256249999999993,
        "leartime_s": 0.011798797000665218,
        "sampletime": 11.22311909700511,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 3260000,
        "reward_mean": -0.9963000000000004,
        "reward_max": -0.3731250000000002,
        "reward_min": -1.8699999999999999,
        "leartime_s": 0.020519868994597346,
        "sampletime": 10.322845260001486,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 3280000,
        "reward_mean": -0.9779268333333334,
        "reward_max": -0.11312499999999974,
        "reward_min": -1.861333333333334,
        "leartime_s": 0.011352436005836353,
        "sampletime": 11.10173231200315,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 3300000,
        "reward_mean": -0.9464750000000003,
        "reward_max": -0.1537500000000001,
        "reward_min": -1.7125000000000008,
        "leartime_s": 0.011116187000880018,
        "sampletime": 10.263223577989265,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 3320000,
        "reward_mean": -0.9745148333333336,
        "reward_max": -0.21062499999999987,
        "reward_min": -1.8768749999999996,
        "leartime_s": 0.02021316799800843,
        "sampletime": 10.516198229015572,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 3340000,
        "reward_mean": -0.8708750000000002,
        "reward_max": -0.023125000000000086,
        "reward_min": -1.6249999999999991,
        "leartime_s": 0.013297124998643994,
        "sampletime": 11.064702667994425,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 3360000,
        "reward_mean": -0.9117000000000003,
        "reward_max": -0.3287499999999998,
        "reward_min": -1.5893749999999993,
        "leartime_s": 0.010955523990560323,
        "sampletime": 10.577952502993867,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 3380000,
        "reward_mean": -0.8443750000000001,
        "reward_max": 0.08000000000000018,
        "reward_min": -1.741874999999999,
        "leartime_s": 0.016917510016355664,
        "sampletime": 10.79117923200829,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 3400000,
        "reward_mean": -0.8758250000000001,
        "reward_max": -0.09687499999999993,
        "reward_min": -2.501875,
        "leartime_s": 0.011932628985960037,
        "sampletime": 11.11575243700645,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 3420000,
        "reward_mean": -0.9567000000000001,
        "reward_max": -0.16812500000000002,
        "reward_min": -1.9268750000000003,
        "leartime_s": 0.013011325994739309,
        "sampletime": 10.289612919994397,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 3440000,
        "reward_mean": -0.9281500000000001,
        "reward_max": -0.28312500000000007,
        "reward_min": -1.9668750000000002,
        "leartime_s": 0.04061366801033728,
        "sampletime": 11.126762339990819,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 3460000,
        "reward_mean": -1.0074000000000003,
        "reward_max": -0.3275000000000001,
        "reward_min": -1.7818750000000008,
        "leartime_s": 0.03870362800080329,
        "sampletime": 10.512238069000887,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 3480000,
        "reward_mean": -1.3056250000000003,
        "reward_max": -0.5450000000000002,
        "reward_min": -3.0700000000000003,
        "leartime_s": 0.01079637199291028,
        "sampletime": 10.679753447999246,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 3500000,
        "reward_mean": -0.9712750000000003,
        "reward_max": -0.13312500000000016,
        "reward_min": -1.7156249999999993,
        "leartime_s": 0.012760133016854525,
        "sampletime": 11.147815949021606,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 3520000,
        "reward_mean": -1.0056326666666668,
        "reward_max": -0.21312500000000004,
        "reward_min": -2.1,
        "leartime_s": 0.052897888992447406,
        "sampletime": 10.33751894897432,
        "best_mean": -0.7432000000000001,
        "best_max": 0.10062500000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 3540000,
        "reward_mean": -0.7275499999999999,
        "reward_max": 0.1181249999999998,
        "reward_min": -2.3299999999999987,
        "leartime_s": 0.020729041018057615,
        "sampletime": 11.502511179016437,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 3560000,
        "reward_mean": -0.9822750000000002,
        "reward_max": -0.05937500000000007,
        "reward_min": -2.3712499999999985,
        "leartime_s": 0.014102954999543726,
        "sampletime": 10.783019484981196,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 3580000,
        "reward_mean": -0.7502741666666668,
        "reward_max": 0.13687500000000014,
        "reward_min": -2.4649999999999994,
        "leartime_s": 0.026034812995931134,
        "sampletime": 10.30840171399177,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 3600000,
        "reward_mean": -0.8495500000000001,
        "reward_max": -0.007499999999999861,
        "reward_min": -2.320624999999999,
        "leartime_s": 0.07923158799530938,
        "sampletime": 11.00610829499783,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 3620000,
        "reward_mean": -0.8563330000000001,
        "reward_max": 0.28500000000000003,
        "reward_min": -2.033749999999999,
        "leartime_s": 0.033625020005274564,
        "sampletime": 10.509502535016509,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 3640000,
        "reward_mean": -1.1739450000000002,
        "reward_max": -0.37749999999999984,
        "reward_min": -3.2249999999999988,
        "leartime_s": 0.03138982399832457,
        "sampletime": 10.365399188012816,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 3660000,
        "reward_mean": -0.7481250000000002,
        "reward_max": 0.03187499999999991,
        "reward_min": -1.5575000000000006,
        "leartime_s": 0.019821255991701037,
        "sampletime": 11.033247157989535,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 3680000,
        "reward_mean": -0.9763750000000002,
        "reward_max": -0.06999999999999999,
        "reward_min": -2.936249999999999,
        "leartime_s": 0.02860180797870271,
        "sampletime": 10.732406501017977,
        "best_mean": -0.7275499999999999,
        "best_max": 0.1181249999999998,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 3700000,
        "reward_mean": -0.6699500000000002,
        "reward_max": 0.31125000000000014,
        "reward_min": -2.340625,
        "leartime_s": 0.026472494995687157,
        "sampletime": 10.750929413014092,
        "best_mean": -0.6699500000000002,
        "best_max": 0.31125000000000014,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 3720000,
        "reward_mean": -0.630725,
        "reward_max": 0.22312500000000035,
        "reward_min": -1.665625,
        "leartime_s": 0.014053513994440436,
        "sampletime": 10.78717690097983,
        "best_mean": -0.630725,
        "best_max": 0.22312500000000035,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 3740000,
        "reward_mean": -0.7580500000000001,
        "reward_max": 0.20250000000000012,
        "reward_min": -1.9687499999999991,
        "leartime_s": 0.012108622991945595,
        "sampletime": 10.520626442012144,
        "best_mean": -0.630725,
        "best_max": 0.22312500000000035,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 3760000,
        "reward_mean": -1.3417249999999998,
        "reward_max": -0.18625000000000033,
        "reward_min": -2.813125,
        "leartime_s": 0.008381877007195726,
        "sampletime": 10.984805229993071,
        "best_mean": -0.630725,
        "best_max": 0.22312500000000035,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 3780000,
        "reward_mean": -0.651675,
        "reward_max": 0.05500000000000009,
        "reward_min": -1.70625,
        "leartime_s": 0.012079213018296286,
        "sampletime": 10.358544210001128,
        "best_mean": -0.630725,
        "best_max": 0.22312500000000035,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 3800000,
        "reward_mean": -0.5893249999999998,
        "reward_max": 0.28437500000000027,
        "reward_min": -1.8218749999999995,
        "leartime_s": 0.012207423016661778,
        "sampletime": 10.073929199017584,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 3820000,
        "reward_mean": -0.6401,
        "reward_max": 0.24687500000000012,
        "reward_min": -2.135,
        "leartime_s": 0.028069874009815976,
        "sampletime": 8.567114370001946,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 3840000,
        "reward_mean": -0.9540000000000001,
        "reward_max": -0.024374999999999584,
        "reward_min": -1.7899999999999991,
        "leartime_s": 0.011923912010388449,
        "sampletime": 8.319082892005099,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 3860000,
        "reward_mean": -0.9595499999999999,
        "reward_max": 0.0012499999999999803,
        "reward_min": -2.3274999999999992,
        "leartime_s": 0.012454175011953339,
        "sampletime": 8.384367894992465,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 3880000,
        "reward_mean": -0.8625750000000002,
        "reward_max": -0.040000000000000174,
        "reward_min": -1.6881250000000003,
        "leartime_s": 0.012405482004396617,
        "sampletime": 8.269709687010618,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 3900000,
        "reward_mean": -0.78175,
        "reward_max": 0.0025000000000003006,
        "reward_min": -2.2837499999999995,
        "leartime_s": 0.01325231697410345,
        "sampletime": 8.282608811976388,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 3920000,
        "reward_mean": -0.6235250000000001,
        "reward_max": 0.24249999999999994,
        "reward_min": -1.4531250000000009,
        "leartime_s": 0.012315164000028744,
        "sampletime": 8.096823635016335,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 3940000,
        "reward_mean": -1.0899750000000001,
        "reward_max": -0.34750000000000014,
        "reward_min": -2.7156249999999984,
        "leartime_s": 0.029239365976536646,
        "sampletime": 8.273399797006277,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 3960000,
        "reward_mean": -0.7369749999999999,
        "reward_max": 0.27500000000000024,
        "reward_min": -2.266249999999999,
        "leartime_s": 0.027719996985979378,
        "sampletime": 8.328804622986354,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 3980000,
        "reward_mean": -1.1159250000000003,
        "reward_max": -0.0056250000000000605,
        "reward_min": -2.415,
        "leartime_s": 0.03234665998024866,
        "sampletime": 8.50374034899869,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 4000000,
        "reward_mean": -0.9474908333333334,
        "reward_max": 0.04625000000000018,
        "reward_min": -1.9699999999999998,
        "leartime_s": 0.028351007000310346,
        "sampletime": 8.500903961976292,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 4020000,
        "reward_mean": -0.61075,
        "reward_max": 0.17937500000000012,
        "reward_min": -1.86625,
        "leartime_s": 0.020386329997563735,
        "sampletime": 8.417818346002605,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 4040000,
        "reward_mean": -0.6859986904761904,
        "reward_max": 0.004375000000000212,
        "reward_min": -1.5099999999999998,
        "leartime_s": 0.011957612005062401,
        "sampletime": 8.28837486897828,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 4060000,
        "reward_mean": -0.9358,
        "reward_max": 0.32375,
        "reward_min": -2.0524999999999998,
        "leartime_s": 0.012136272998759523,
        "sampletime": 8.50983231299324,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 4080000,
        "reward_mean": -0.9512249999999999,
        "reward_max": 0.0906250000000002,
        "reward_min": -2.3762499999999993,
        "leartime_s": 0.03011220900225453,
        "sampletime": 8.483286547008902,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 4100000,
        "reward_mean": -0.8363,
        "reward_max": 0.08750000000000034,
        "reward_min": -1.8406249999999995,
        "leartime_s": 0.012253359018359333,
        "sampletime": 8.219756078004139,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 4120000,
        "reward_mean": -0.5958249999999998,
        "reward_max": 0.4718750000000001,
        "reward_min": -2.0937499999999987,
        "leartime_s": 0.012651095981709659,
        "sampletime": 8.42611796798883,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 4140000,
        "reward_mean": -0.94085,
        "reward_max": 0.38500000000000023,
        "reward_min": -2.9699999999999984,
        "leartime_s": 0.012683726992690936,
        "sampletime": 8.416382457013242,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 4160000,
        "reward_mean": -0.9668749999999998,
        "reward_max": -0.017499999999999842,
        "reward_min": -2.2668749999999993,
        "leartime_s": 0.012758206983562559,
        "sampletime": 8.205991538008675,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 4180000,
        "reward_mean": -0.713675,
        "reward_max": 0.25562500000000016,
        "reward_min": -2.095,
        "leartime_s": 0.012425154010998085,
        "sampletime": 8.428670446999604,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 4200000,
        "reward_mean": -0.7288749999999997,
        "reward_max": 0.18250000000000058,
        "reward_min": -1.7293749999999997,
        "leartime_s": 0.014026215008925647,
        "sampletime": 8.306491373019526,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 4220000,
        "reward_mean": -0.6997000000000001,
        "reward_max": 0.5118750000000004,
        "reward_min": -2.3168749999999987,
        "leartime_s": 0.019588037976063788,
        "sampletime": 8.32517670901143,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 4240000,
        "reward_mean": -0.8821499999999999,
        "reward_max": 0.24625000000000022,
        "reward_min": -2.2137499999999997,
        "leartime_s": 0.015381422999780625,
        "sampletime": 8.39784128399333,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 4260000,
        "reward_mean": -0.7358499999999999,
        "reward_max": 0.15750000000000025,
        "reward_min": -1.948124999999999,
        "leartime_s": 0.012457245000405237,
        "sampletime": 8.310726647003321,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 4280000,
        "reward_mean": -0.9266749999999998,
        "reward_max": 0.19625000000000017,
        "reward_min": -2.726874999999999,
        "leartime_s": 0.014297306013759226,
        "sampletime": 8.517062322993297,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 4300000,
        "reward_mean": -0.810175,
        "reward_max": 0.2725000000000003,
        "reward_min": -1.7137500000000003,
        "leartime_s": 0.013100838987156749,
        "sampletime": 8.461309865000658,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 4320000,
        "reward_mean": -1.0651249999999997,
        "reward_max": 0.27124999999999994,
        "reward_min": -2.8093749999999984,
        "leartime_s": 0.02187595100258477,
        "sampletime": 8.469493167009205,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 4340000,
        "reward_mean": -0.9448249999999998,
        "reward_max": -0.19687499999999966,
        "reward_min": -2.3306249999999986,
        "leartime_s": 0.01278056699084118,
        "sampletime": 8.264565132005373,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 4360000,
        "reward_mean": -0.8124749999999998,
        "reward_max": 0.4143750000000006,
        "reward_min": -1.9350000000000005,
        "leartime_s": 0.021932801988441497,
        "sampletime": 8.335365625011036,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 4380000,
        "reward_mean": -0.7343499999999997,
        "reward_max": 0.23812500000000003,
        "reward_min": -1.9831249999999994,
        "leartime_s": 0.017472554987762123,
        "sampletime": 8.323162015003618,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 4400000,
        "reward_mean": -0.8270249999999999,
        "reward_max": -0.1081249999999998,
        "reward_min": -1.7131250000000002,
        "leartime_s": 0.013515010999981314,
        "sampletime": 8.312527794012567,
        "best_mean": -0.5893249999999998,
        "best_max": 0.28437500000000027,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 4420000,
        "reward_mean": -0.5739249999999997,
        "reward_max": 0.5175000000000004,
        "reward_min": -1.8468749999999994,
        "leartime_s": 0.013182230002712458,
        "sampletime": 8.506501778989332,
        "best_mean": -0.5739249999999997,
        "best_max": 0.5175000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 4440000,
        "reward_mean": -0.857,
        "reward_max": 0.11375000000000027,
        "reward_min": -1.9693749999999994,
        "leartime_s": 0.012782706995494664,
        "sampletime": 8.227028170018457,
        "best_mean": -0.5739249999999997,
        "best_max": 0.5175000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 4460000,
        "reward_mean": -0.7481249999999998,
        "reward_max": 0.6543750000000002,
        "reward_min": -2.2243749999999993,
        "leartime_s": 0.01412100499146618,
        "sampletime": 8.443675065995194,
        "best_mean": -0.5739249999999997,
        "best_max": 0.5175000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 4480000,
        "reward_mean": -1.1111499999999999,
        "reward_max": -0.1199999999999997,
        "reward_min": -2.373124999999999,
        "leartime_s": 0.0128590950043872,
        "sampletime": 8.239376996003557,
        "best_mean": -0.5739249999999997,
        "best_max": 0.5175000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 4500000,
        "reward_mean": -0.7222249999999999,
        "reward_max": 0.2687500000000001,
        "reward_min": -1.8581249999999996,
        "leartime_s": 0.014128820010228083,
        "sampletime": 8.458412748004775,
        "best_mean": -0.5739249999999997,
        "best_max": 0.5175000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 4520000,
        "reward_mean": -0.4316999999999998,
        "reward_max": 0.46062500000000034,
        "reward_min": -1.198125,
        "leartime_s": 0.026304911996703595,
        "sampletime": 8.571269965992542,
        "best_mean": -0.4316999999999998,
        "best_max": 0.46062500000000034,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 4540000,
        "reward_mean": -0.3165749999999998,
        "reward_max": 0.8918750000000006,
        "reward_min": -1.6449999999999994,
        "leartime_s": 0.013659190008183941,
        "sampletime": 8.2529698080034,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 4560000,
        "reward_mean": -0.729425,
        "reward_max": 0.3343750000000003,
        "reward_min": -2.2899999999999996,
        "leartime_s": 0.0133677429985255,
        "sampletime": 8.423429779009894,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 4580000,
        "reward_mean": -0.8006749999999999,
        "reward_max": 0.3725000000000002,
        "reward_min": -2.656875,
        "leartime_s": 0.032683869008906186,
        "sampletime": 8.302309302991489,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 4600000,
        "reward_mean": -0.33024999999999977,
        "reward_max": 0.7625000000000004,
        "reward_min": -1.369999999999999,
        "leartime_s": 0.019180293020326644,
        "sampletime": 8.257823138992535,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 4620000,
        "reward_mean": -0.5012749999999998,
        "reward_max": 0.26437500000000036,
        "reward_min": -1.5156249999999993,
        "leartime_s": 0.06855256599374115,
        "sampletime": 8.347347420989536,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 4640000,
        "reward_mean": -0.7965249999999998,
        "reward_max": -0.11562499999999992,
        "reward_min": -2.180000000000001,
        "leartime_s": 0.014969030977226794,
        "sampletime": 8.58671873199637,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 4660000,
        "reward_mean": -0.43272499999999975,
        "reward_max": 0.3462500000000002,
        "reward_min": -1.6506249999999998,
        "leartime_s": 0.013442212017253041,
        "sampletime": 8.30350629100576,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 4680000,
        "reward_mean": -0.9914499999999996,
        "reward_max": 0.1343750000000003,
        "reward_min": -2.5712499999999996,
        "leartime_s": 0.03293989799567498,
        "sampletime": 8.443714246997843,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 4700000,
        "reward_mean": -1.1326749999999997,
        "reward_max": -0.13499999999999995,
        "reward_min": -2.946875,
        "leartime_s": 0.023597823979798704,
        "sampletime": 8.181841707002604,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 4720000,
        "reward_mean": -0.4216999999999997,
        "reward_max": 0.6868750000000002,
        "reward_min": -1.8174999999999981,
        "leartime_s": 0.03151855801115744,
        "sampletime": 8.516678973013768,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 4740000,
        "reward_mean": -0.7312999999999997,
        "reward_max": 0.3493750000000009,
        "reward_min": -1.9787500000000005,
        "leartime_s": 0.022255146002862602,
        "sampletime": 8.415530922007747,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 4760000,
        "reward_mean": -0.5493249999999998,
        "reward_max": 0.5925000000000002,
        "reward_min": -1.8350000000000009,
        "leartime_s": 0.0346799110120628,
        "sampletime": 8.28019708400825,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 4780000,
        "reward_mean": -0.5304999999999997,
        "reward_max": 0.6100000000000005,
        "reward_min": -1.6562499999999993,
        "leartime_s": 0.01554970198776573,
        "sampletime": 8.333269345981535,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 4800000,
        "reward_mean": -0.9474749999999998,
        "reward_max": 0.07,
        "reward_min": -2.100625,
        "leartime_s": 0.01800888602156192,
        "sampletime": 8.612765136000235,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 4820000,
        "reward_mean": -0.6134749999999998,
        "reward_max": 0.23937500000000025,
        "reward_min": -1.6093749999999984,
        "leartime_s": 0.014445237000472844,
        "sampletime": 8.69255160301691,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 4840000,
        "reward_mean": -0.9365999999999998,
        "reward_max": 0.30937500000000034,
        "reward_min": -2.2924999999999986,
        "leartime_s": 0.013399713992839679,
        "sampletime": 8.341090610978426,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 4860000,
        "reward_mean": -0.8338999999999998,
        "reward_max": 0.08187500000000011,
        "reward_min": -2.0949999999999998,
        "leartime_s": 0.013848647009581327,
        "sampletime": 8.272952487983275,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 4880000,
        "reward_mean": -0.7578249999999999,
        "reward_max": 0.31500000000000034,
        "reward_min": -2.2087499999999998,
        "leartime_s": 0.049336488998960704,
        "sampletime": 8.40253200000734,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 4900000,
        "reward_mean": -0.6905249999999995,
        "reward_max": 0.1931250000000005,
        "reward_min": -1.7449999999999994,
        "leartime_s": 0.035819117998471484,
        "sampletime": 8.390930962981656,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 4920000,
        "reward_mean": -0.7208999999999999,
        "reward_max": 0.3181250000000006,
        "reward_min": -2.464999999999999,
        "leartime_s": 0.0339008430019021,
        "sampletime": 8.634362392011099,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 4940000,
        "reward_mean": -0.43337499999999973,
        "reward_max": 0.45125000000000076,
        "reward_min": -1.5312500000000002,
        "leartime_s": 0.01368358198669739,
        "sampletime": 8.416925907018594,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 4960000,
        "reward_mean": -0.9636749999999998,
        "reward_max": -0.18375,
        "reward_min": -2.25875,
        "leartime_s": 0.016412408993346617,
        "sampletime": 8.405313135008328,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 4980000,
        "reward_mean": -0.6937499999999998,
        "reward_max": 0.24687500000000043,
        "reward_min": -1.7281249999999992,
        "leartime_s": 0.026373340020654723,
        "sampletime": 8.378660232992843,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 5000000,
        "reward_mean": -0.7900999999999997,
        "reward_max": 0.31187500000000024,
        "reward_min": -2.522499999999999,
        "leartime_s": 0.014774980983929709,
        "sampletime": 8.477871059003519,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 5020000,
        "reward_mean": -0.8544249999999998,
        "reward_max": 0.1643750000000001,
        "reward_min": -1.9493749999999985,
        "leartime_s": 0.020022662007249892,
        "sampletime": 8.360582930996316,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 5040000,
        "reward_mean": -0.5289749999999999,
        "reward_max": 0.23812500000000048,
        "reward_min": -1.5737499999999998,
        "leartime_s": 0.027963341010035947,
        "sampletime": 8.14314794098027,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 5060000,
        "reward_mean": -0.5055249999999999,
        "reward_max": 0.2306250000000003,
        "reward_min": -1.66625,
        "leartime_s": 0.013904969004215673,
        "sampletime": 8.210572725016391,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 5080000,
        "reward_mean": -0.9261249999999998,
        "reward_max": -0.11624999999999999,
        "reward_min": -2.158749999999999,
        "leartime_s": 0.014548244973411784,
        "sampletime": 8.325357351015555,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 5100000,
        "reward_mean": -0.7022499999999996,
        "reward_max": 0.4293750000000003,
        "reward_min": -1.8999999999999997,
        "leartime_s": 0.01422109201666899,
        "sampletime": 8.268206758017186,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 5120000,
        "reward_mean": -0.43227499999999974,
        "reward_max": 0.7275000000000006,
        "reward_min": -1.4774999999999994,
        "leartime_s": 0.014335521002067253,
        "sampletime": 8.233154545014258,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 5140000,
        "reward_mean": -0.9234499999999998,
        "reward_max": 0.45437500000000075,
        "reward_min": -2.7775000000000003,
        "leartime_s": 0.01549246400827542,
        "sampletime": 8.291763241984881,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 5160000,
        "reward_mean": -0.7221249999999998,
        "reward_max": 0.1750000000000004,
        "reward_min": -1.861874999999999,
        "leartime_s": 0.01440769201144576,
        "sampletime": 8.350598861987237,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 5180000,
        "reward_mean": -0.9341499999999997,
        "reward_max": 0.03375000000000028,
        "reward_min": -2.108749999999999,
        "leartime_s": 0.02391576100490056,
        "sampletime": 8.51072539400775,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 5200000,
        "reward_mean": -0.42232499999999984,
        "reward_max": 0.6581250000000003,
        "reward_min": -1.8268749999999994,
        "leartime_s": 0.03771324499393813,
        "sampletime": 8.439610589004587,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 5220000,
        "reward_mean": -0.8882499999999998,
        "reward_max": 0.041249999999999634,
        "reward_min": -2.2624999999999993,
        "leartime_s": 0.01933183698565699,
        "sampletime": 8.448507157008862,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 5240000,
        "reward_mean": -0.5132749999999997,
        "reward_max": 0.3500000000000003,
        "reward_min": -1.5631249999999999,
        "leartime_s": 0.030829737021122128,
        "sampletime": 8.378910828003427,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 5260000,
        "reward_mean": -0.8880750000000001,
        "reward_max": 0.35,
        "reward_min": -2.39625,
        "leartime_s": 0.014957233011955395,
        "sampletime": 8.319254653993994,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 5280000,
        "reward_mean": -0.8061999999999997,
        "reward_max": 0.2406250000000006,
        "reward_min": -2.1818750000000002,
        "leartime_s": 0.014427268004510552,
        "sampletime": 8.450933307001833,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 5300000,
        "reward_mean": -0.7362249999999999,
        "reward_max": 0.30937500000000046,
        "reward_min": -1.4200000000000002,
        "leartime_s": 0.029005992983002216,
        "sampletime": 8.320212421996985,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 5320000,
        "reward_mean": -0.7821999999999996,
        "reward_max": 0.10250000000000037,
        "reward_min": -1.9993749999999986,
        "leartime_s": 0.0212952510046307,
        "sampletime": 8.316155363019789,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 5340000,
        "reward_mean": -0.7237499999999998,
        "reward_max": 0.09125000000000028,
        "reward_min": -2.005625,
        "leartime_s": 0.026833654002984986,
        "sampletime": 8.361751688004006,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 5360000,
        "reward_mean": -0.6466249999999998,
        "reward_max": 0.37437499999999957,
        "reward_min": -1.7824999999999993,
        "leartime_s": 0.015842609020182863,
        "sampletime": 8.210589891998097,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 5380000,
        "reward_mean": -0.7310249999999998,
        "reward_max": 0.15562499999999999,
        "reward_min": -2.4287500000000004,
        "leartime_s": 0.015735227992990986,
        "sampletime": 8.388809972006129,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 5400000,
        "reward_mean": -0.869675,
        "reward_max": -0.02437499999999978,
        "reward_min": -2.274374999999999,
        "leartime_s": 0.01720142099657096,
        "sampletime": 8.371133188979002,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 5420000,
        "reward_mean": -0.6420249999999996,
        "reward_max": 0.21687500000000026,
        "reward_min": -1.8924999999999992,
        "leartime_s": 0.02195840099011548,
        "sampletime": 8.205942030996084,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 5440000,
        "reward_mean": -0.7841749999999998,
        "reward_max": 0.0725000000000005,
        "reward_min": -1.817499999999999,
        "leartime_s": 0.015054699004394934,
        "sampletime": 8.362562245019944,
        "best_mean": -0.3165749999999998,
        "best_max": 0.8918750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 5460000,
        "reward_mean": -0.27982499999999993,
        "reward_max": 0.7800000000000004,
        "reward_min": -1.3018750000000008,
        "leartime_s": 0.01064504700480029,
        "sampletime": 8.260329107986763,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 5480000,
        "reward_mean": -0.7380249999999999,
        "reward_max": 0.23562499999999995,
        "reward_min": -1.86,
        "leartime_s": 0.01576841398491524,
        "sampletime": 8.334167166001862,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 5500000,
        "reward_mean": -0.47182499999999983,
        "reward_max": 0.5731250000000003,
        "reward_min": -1.8056249999999994,
        "leartime_s": 0.01670302200363949,
        "sampletime": 8.637748592009302,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 5520000,
        "reward_mean": -0.7861999999999998,
        "reward_max": 0.22937500000000027,
        "reward_min": -1.9587500000000004,
        "leartime_s": 0.01613157702377066,
        "sampletime": 8.36412760798703,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 5540000,
        "reward_mean": -0.7113999999999997,
        "reward_max": 0.3375000000000004,
        "reward_min": -1.7606249999999986,
        "leartime_s": 0.016477790020871907,
        "sampletime": 8.279155683005229,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 5560000,
        "reward_mean": -0.6866749999999999,
        "reward_max": 0.27062500000000056,
        "reward_min": -1.9687499999999998,
        "leartime_s": 0.015632123016985133,
        "sampletime": 8.352568336995319,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 5580000,
        "reward_mean": -0.35829999999999973,
        "reward_max": 0.6043750000000003,
        "reward_min": -1.478749999999999,
        "leartime_s": 0.016466575994854793,
        "sampletime": 8.30199984900537,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 5600000,
        "reward_mean": -0.812425,
        "reward_max": 0.21750000000000028,
        "reward_min": -2.0149999999999997,
        "leartime_s": 0.0333814479818102,
        "sampletime": 8.13569882401498,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 5620000,
        "reward_mean": -0.45089999999999986,
        "reward_max": 0.9306250000000003,
        "reward_min": -1.7318749999999996,
        "leartime_s": 0.024453766003716737,
        "sampletime": 8.483830754994415,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 5640000,
        "reward_mean": -0.73205,
        "reward_max": 0.1712500000000003,
        "reward_min": -1.7199999999999998,
        "leartime_s": 0.02547381501062773,
        "sampletime": 8.315029677993152,
        "best_mean": -0.27982499999999993,
        "best_max": 0.7800000000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 5660000,
        "reward_mean": -0.1228249999999998,
        "reward_max": 0.7025000000000001,
        "reward_min": -1.1531249999999997,
        "leartime_s": 0.019108548993244767,
        "sampletime": 8.4557675679971,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 5680000,
        "reward_mean": -0.8182499999999999,
        "reward_max": 0.1200000000000003,
        "reward_min": -1.9287500000000017,
        "leartime_s": 0.03343787899939343,
        "sampletime": 8.253911216015695,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 5700000,
        "reward_mean": -0.5930999999999996,
        "reward_max": 0.30125000000000035,
        "reward_min": -1.7693749999999995,
        "leartime_s": 0.0167398149787914,
        "sampletime": 8.356420623982558,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 5720000,
        "reward_mean": -0.8011749999999997,
        "reward_max": 0.1800000000000005,
        "reward_min": -1.9912499999999997,
        "leartime_s": 0.01770907299942337,
        "sampletime": 8.337480488989968,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 5740000,
        "reward_mean": -0.5910999999999998,
        "reward_max": 0.35062500000000046,
        "reward_min": -1.56375,
        "leartime_s": 0.016863966011442244,
        "sampletime": 8.390597933990648,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 5760000,
        "reward_mean": -0.6820249999999997,
        "reward_max": 0.4306250000000004,
        "reward_min": -1.8324999999999996,
        "leartime_s": 0.016091170022264123,
        "sampletime": 8.330722017009975,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 5780000,
        "reward_mean": -0.5500499999999998,
        "reward_max": 0.0643750000000003,
        "reward_min": -1.936875000000001,
        "leartime_s": 0.02848558299592696,
        "sampletime": 8.476822494005319,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 5800000,
        "reward_mean": -0.6597249999999998,
        "reward_max": 0.5106249999999999,
        "reward_min": -1.9193749999999998,
        "leartime_s": 0.026511265023145825,
        "sampletime": 8.484710250981152,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 5820000,
        "reward_mean": -0.6197499999999998,
        "reward_max": 0.2043750000000003,
        "reward_min": -1.8081249999999995,
        "leartime_s": 0.03417561200330965,
        "sampletime": 8.278791307995562,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 5840000,
        "reward_mean": -0.4439999999999998,
        "reward_max": 0.6937500000000006,
        "reward_min": -1.5293749999999993,
        "leartime_s": 0.021569122007349506,
        "sampletime": 8.2951900959888,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 5860000,
        "reward_mean": -0.4000749999999997,
        "reward_max": 0.5775000000000003,
        "reward_min": -1.869375,
        "leartime_s": 0.017924791987752542,
        "sampletime": 8.40324690201669,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 5880000,
        "reward_mean": -0.6098749999999995,
        "reward_max": 0.6581250000000007,
        "reward_min": -2.054999999999999,
        "leartime_s": 0.01681583299068734,
        "sampletime": 8.425545900012366,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 5900000,
        "reward_mean": -0.6442249999999997,
        "reward_max": 0.37562500000000076,
        "reward_min": -1.716875000000001,
        "leartime_s": 0.03246862400555983,
        "sampletime": 8.19769995502429,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 5920000,
        "reward_mean": -0.47907499999999986,
        "reward_max": 0.4968750000000003,
        "reward_min": -1.6949999999999996,
        "leartime_s": 0.018290815001819283,
        "sampletime": 8.199228128010873,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 5940000,
        "reward_mean": -0.6019249999999996,
        "reward_max": 0.42437500000000056,
        "reward_min": -2.402499999999998,
        "leartime_s": 0.03920627699699253,
        "sampletime": 8.300697414000751,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 5960000,
        "reward_mean": -0.2132499999999996,
        "reward_max": 0.6662500000000003,
        "reward_min": -1.235625,
        "leartime_s": 0.01838786600274034,
        "sampletime": 8.347785414021928,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 5980000,
        "reward_mean": -0.6845249999999996,
        "reward_max": 0.16687500000000077,
        "reward_min": -1.7137499999999992,
        "leartime_s": 0.016534877999220043,
        "sampletime": 8.374891482002567,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 6000000,
        "reward_mean": -0.3626999999999997,
        "reward_max": 0.6531250000000004,
        "reward_min": -1.3531250000000001,
        "leartime_s": 0.01748855400364846,
        "sampletime": 8.45776649902109,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 6020000,
        "reward_mean": -0.34907499999999975,
        "reward_max": 0.5425000000000003,
        "reward_min": -2.5924999999999994,
        "leartime_s": 0.016616917011560872,
        "sampletime": 8.394032477022847,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 6040000,
        "reward_mean": -0.3377999999999995,
        "reward_max": 0.6581250000000005,
        "reward_min": -1.6856250000000006,
        "leartime_s": 0.02061497000977397,
        "sampletime": 8.380899606010644,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 6060000,
        "reward_mean": -0.25957499999999956,
        "reward_max": 0.8125000000000001,
        "reward_min": -1.6849999999999996,
        "leartime_s": 0.03745043801609427,
        "sampletime": 8.43144526501419,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 6080000,
        "reward_mean": -0.5880249999999997,
        "reward_max": 0.6587500000000002,
        "reward_min": -1.739999999999999,
        "leartime_s": 0.0292330399970524,
        "sampletime": 8.438980756996898,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 6100000,
        "reward_mean": -0.5570249999999998,
        "reward_max": 0.44999999999999996,
        "reward_min": -2.0512499999999987,
        "leartime_s": 0.018361750000622123,
        "sampletime": 8.403138597990619,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 6120000,
        "reward_mean": -0.34124999999999966,
        "reward_max": 0.5993750000000004,
        "reward_min": -3.1712499999999992,
        "leartime_s": 0.016567336017033085,
        "sampletime": 8.31249093200313,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 6140000,
        "reward_mean": -0.22267499999999985,
        "reward_max": 0.7118750000000005,
        "reward_min": -1.1156249999999999,
        "leartime_s": 0.02824153797701001,
        "sampletime": 8.296788381994702,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 6160000,
        "reward_mean": -0.18534999999999974,
        "reward_max": 0.6800000000000003,
        "reward_min": -1.4950000000000006,
        "leartime_s": 0.01914727801340632,
        "sampletime": 8.439859229983995,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 6180000,
        "reward_mean": -0.4367999999999997,
        "reward_max": 0.7100000000000005,
        "reward_min": -1.7037499999999997,
        "leartime_s": 0.03414841598714702,
        "sampletime": 8.335437865025597,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 6200000,
        "reward_mean": -0.32854999999999973,
        "reward_max": 0.5550000000000009,
        "reward_min": -1.5281250000000008,
        "leartime_s": 0.026672165986383334,
        "sampletime": 8.408428700000513,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 6220000,
        "reward_mean": -0.5080999999999998,
        "reward_max": 0.38000000000000056,
        "reward_min": -1.7037499999999992,
        "leartime_s": 0.02568985801190138,
        "sampletime": 8.222773199988296,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 6240000,
        "reward_mean": -0.22052499999999972,
        "reward_max": 0.7306250000000005,
        "reward_min": -1.1618749999999989,
        "leartime_s": 0.019736821996048093,
        "sampletime": 8.377037611993728,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 6260000,
        "reward_mean": -0.3486999999999998,
        "reward_max": 0.4156250000000006,
        "reward_min": -1.2624999999999995,
        "leartime_s": 0.018465478002326563,
        "sampletime": 8.255006432998925,
        "best_mean": -0.1228249999999998,
        "best_max": 0.7025000000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 6280000,
        "reward_mean": -0.015674999999999634,
        "reward_max": 1.0431250000000005,
        "reward_min": -0.8643750000000001,
        "leartime_s": 0.018391327001154423,
        "sampletime": 8.278097403992433,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 6300000,
        "reward_mean": -0.6251499999999997,
        "reward_max": 0.6181250000000003,
        "reward_min": -2.318125,
        "leartime_s": 0.016430882998974994,
        "sampletime": 8.36572881398024,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 6320000,
        "reward_mean": -0.5374499999999994,
        "reward_max": 0.33312500000000045,
        "reward_min": -1.8362499999999993,
        "leartime_s": 0.020139100990490988,
        "sampletime": 8.414732251985697,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 6340000,
        "reward_mean": -0.3247249999999996,
        "reward_max": 0.6137500000000005,
        "reward_min": -1.6825,
        "leartime_s": 0.0403700589959044,
        "sampletime": 8.572456121997675,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 6360000,
        "reward_mean": -0.11022499999999955,
        "reward_max": 1.1356250000000008,
        "reward_min": -0.9981249999999997,
        "leartime_s": 0.039921684976434335,
        "sampletime": 8.399536725977669,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 6380000,
        "reward_mean": -0.2955249999999996,
        "reward_max": 0.7137500000000004,
        "reward_min": -1.9737499999999994,
        "leartime_s": 0.02357146400026977,
        "sampletime": 8.299116481008241,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 6400000,
        "reward_mean": -0.28669999999999946,
        "reward_max": 0.5600000000000003,
        "reward_min": -1.6937499999999999,
        "leartime_s": 0.01966774699394591,
        "sampletime": 8.443342267011758,
        "best_mean": -0.015674999999999634,
        "best_max": 1.0431250000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 6420000,
        "reward_mean": 0.08437500000000055,
        "reward_max": 1.0137500000000008,
        "reward_min": -1.1024999999999994,
        "leartime_s": 0.02220912298071198,
        "sampletime": 8.304882164986338,
        "best_mean": 0.08437500000000055,
        "best_max": 1.0137500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 6440000,
        "reward_mean": 0.08500000000000041,
        "reward_max": 0.9937500000000004,
        "reward_min": -0.8731249999999994,
        "leartime_s": 0.016796140000224113,
        "sampletime": 8.422340618009912,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 6460000,
        "reward_mean": -0.04874999999999949,
        "reward_max": 0.7968750000000006,
        "reward_min": -1.220625,
        "leartime_s": 0.044053552992409095,
        "sampletime": 8.227743398019811,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 6480000,
        "reward_mean": -0.5787249999999995,
        "reward_max": 0.46812500000000024,
        "reward_min": -2.9356249999999986,
        "leartime_s": 0.017946439009392634,
        "sampletime": 8.369266512978356,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 6500000,
        "reward_mean": -0.2459239999999997,
        "reward_max": 0.7318750000000006,
        "reward_min": -1.3118750000000001,
        "leartime_s": 0.027918086998397484,
        "sampletime": 8.374318260990549,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 6520000,
        "reward_mean": -0.7373999999999993,
        "reward_max": 0.6100000000000003,
        "reward_min": -3.0737499999999973,
        "leartime_s": 0.024572211026679724,
        "sampletime": 8.494060632016044,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 6540000,
        "reward_mean": 0.0057250000000004415,
        "reward_max": 0.7750000000000001,
        "reward_min": -0.8306249999999995,
        "leartime_s": 0.02005576598457992,
        "sampletime": 8.484707925992552,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 6560000,
        "reward_mean": -0.09749999999999943,
        "reward_max": 0.9843750000000001,
        "reward_min": -1.5693749999999986,
        "leartime_s": 0.018411303986795247,
        "sampletime": 8.39768515099422,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 6580000,
        "reward_mean": 0.04995000000000043,
        "reward_max": 0.8781250000000005,
        "reward_min": -0.8943749999999998,
        "leartime_s": 0.022573993977857754,
        "sampletime": 8.246272104996024,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 6600000,
        "reward_mean": -0.08812499999999945,
        "reward_max": 0.893125000000001,
        "reward_min": -0.9418749999999989,
        "leartime_s": 0.038302623986965045,
        "sampletime": 8.2810191460012,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 6620000,
        "reward_mean": -0.4513749999999995,
        "reward_max": 0.8831250000000005,
        "reward_min": -1.8681249999999987,
        "leartime_s": 0.03490826999768615,
        "sampletime": 8.51149723600247,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 6640000,
        "reward_mean": -0.1300499999999997,
        "reward_max": 0.8025000000000005,
        "reward_min": -1.28125,
        "leartime_s": 0.020169221999822184,
        "sampletime": 8.271942103019683,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 6660000,
        "reward_mean": -0.11354999999999951,
        "reward_max": 1.0400000000000005,
        "reward_min": -1.365,
        "leartime_s": 0.017397656018147245,
        "sampletime": 8.229847309994511,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 6680000,
        "reward_mean": -0.13957499999999945,
        "reward_max": 0.7325000000000006,
        "reward_min": -1.5524999999999984,
        "leartime_s": 0.024642018019221723,
        "sampletime": 8.351260877010645,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 6700000,
        "reward_mean": -0.32649999999999957,
        "reward_max": 0.6906250000000005,
        "reward_min": -2.291249999999999,
        "leartime_s": 0.01802978600608185,
        "sampletime": 8.324865006987238,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 6720000,
        "reward_mean": -0.44084999999999935,
        "reward_max": 0.7218750000000005,
        "reward_min": -1.6575,
        "leartime_s": 0.036482039984548464,
        "sampletime": 8.371878739999374,
        "best_mean": 0.08500000000000041,
        "best_max": 0.9937500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 6740000,
        "reward_mean": 0.27607500000000046,
        "reward_max": 1.2581250000000002,
        "reward_min": -0.7412499999999993,
        "leartime_s": 0.019471876992611215,
        "sampletime": 8.336850502993912,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 6760000,
        "reward_mean": -0.25512499999999944,
        "reward_max": 0.5318750000000004,
        "reward_min": -1.5799999999999987,
        "leartime_s": 0.01808829899528064,
        "sampletime": 8.352295666991267,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 6780000,
        "reward_mean": -0.3687749999999994,
        "reward_max": 0.5475000000000004,
        "reward_min": -1.3993749999999996,
        "leartime_s": 0.04197867802577093,
        "sampletime": 8.515895209013252,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 6800000,
        "reward_mean": -0.0811499999999994,
        "reward_max": 0.7043750000000003,
        "reward_min": -1.0812499999999994,
        "leartime_s": 0.023749390995362774,
        "sampletime": 8.313001742993947,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 6820000,
        "reward_mean": -0.08874999999999957,
        "reward_max": 1.0800000000000007,
        "reward_min": -1.2356250000000002,
        "leartime_s": 0.01748737200978212,
        "sampletime": 8.507796046993462,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 6840000,
        "reward_mean": -0.3114749999999995,
        "reward_max": 0.48625000000000035,
        "reward_min": -1.5124999999999993,
        "leartime_s": 0.020167743001366034,
        "sampletime": 8.364613023004495,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 6860000,
        "reward_mean": -0.2406749999999997,
        "reward_max": 0.6825000000000003,
        "reward_min": -1.0562499999999997,
        "leartime_s": 0.031877500005066395,
        "sampletime": 8.403548762988066,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 6880000,
        "reward_mean": -0.6258249999999993,
        "reward_max": 0.42187500000000044,
        "reward_min": -2.286249999999999,
        "leartime_s": 0.01783978199819103,
        "sampletime": 8.335850935021881,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 6900000,
        "reward_mean": -0.18579999999999958,
        "reward_max": 0.6268750000000004,
        "reward_min": -1.3387499999999997,
        "leartime_s": 0.019380996993277222,
        "sampletime": 8.402854224987095,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 6920000,
        "reward_mean": -0.21902499999999958,
        "reward_max": 1.0018750000000005,
        "reward_min": -1.6356249999999992,
        "leartime_s": 0.022691589023452252,
        "sampletime": 8.19318370099063,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 6940000,
        "reward_mean": -0.38749999999999946,
        "reward_max": 0.5606250000000007,
        "reward_min": -1.5868750000000005,
        "leartime_s": 0.02013981799245812,
        "sampletime": 8.379782884992892,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 6960000,
        "reward_mean": -0.46059999999999945,
        "reward_max": 0.4443750000000004,
        "reward_min": -1.584374999999999,
        "leartime_s": 0.017824520997237414,
        "sampletime": 8.379781337018358,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 6980000,
        "reward_mean": -0.1692999999999996,
        "reward_max": 1.1506250000000002,
        "reward_min": -1.4306249999999994,
        "leartime_s": 0.018143766006687656,
        "sampletime": 8.372874551976565,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 7000000,
        "reward_mean": -0.26624999999999943,
        "reward_max": 0.9593750000000003,
        "reward_min": -1.7262499999999985,
        "leartime_s": 0.022491960000479594,
        "sampletime": 8.281187398999464,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 7020000,
        "reward_mean": -0.5088499999999995,
        "reward_max": 0.6837500000000006,
        "reward_min": -1.9231249999999998,
        "leartime_s": 0.020027127000503242,
        "sampletime": 8.306135668011848,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 7040000,
        "reward_mean": -0.15249999999999944,
        "reward_max": 0.6362500000000005,
        "reward_min": -1.0612499999999996,
        "leartime_s": 0.021346838009776548,
        "sampletime": 8.553562225017231,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 7060000,
        "reward_mean": -0.08017499999999957,
        "reward_max": 0.7612500000000006,
        "reward_min": -1.7556249999999993,
        "leartime_s": 0.019859235995681956,
        "sampletime": 8.579026363993762,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 7080000,
        "reward_mean": -0.10067499999999933,
        "reward_max": 0.6687500000000007,
        "reward_min": -1.4043749999999995,
        "leartime_s": 0.05580271501094103,
        "sampletime": 8.448856801027432,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 7100000,
        "reward_mean": -0.09099999999999941,
        "reward_max": 1.2193750000000008,
        "reward_min": -1.6399999999999995,
        "leartime_s": 0.035845583013724536,
        "sampletime": 8.67352955599199,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 7120000,
        "reward_mean": -0.38332499999999947,
        "reward_max": 0.6825000000000008,
        "reward_min": -1.4525,
        "leartime_s": 0.018768267997074872,
        "sampletime": 8.398266463016625,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 7140000,
        "reward_mean": -0.1594749999999995,
        "reward_max": 0.6250000000000009,
        "reward_min": -1.3362499999999977,
        "leartime_s": 0.02641903402400203,
        "sampletime": 8.399996007006848,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 7160000,
        "reward_mean": 0.027800000000000363,
        "reward_max": 1.0868750000000005,
        "reward_min": -1.1862499999999996,
        "leartime_s": 0.021594328980427235,
        "sampletime": 8.398678522993578,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 7180000,
        "reward_mean": -0.1176249999999995,
        "reward_max": 0.9462500000000005,
        "reward_min": -1.848749999999999,
        "leartime_s": 0.044803513010265306,
        "sampletime": 8.129350592003902,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 7200000,
        "reward_mean": -0.2561749999999995,
        "reward_max": 0.9475000000000007,
        "reward_min": -1.5893749999999982,
        "leartime_s": 0.023460401978809386,
        "sampletime": 8.354138972004876,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 7220000,
        "reward_mean": -0.025199999999999497,
        "reward_max": 1.3043750000000005,
        "reward_min": -1.1268749999999994,
        "leartime_s": 0.027701603015884757,
        "sampletime": 8.495978454011492,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 7240000,
        "reward_mean": -0.2655499999999995,
        "reward_max": 0.8481250000000004,
        "reward_min": -1.9562500000000003,
        "leartime_s": 0.013309247995493934,
        "sampletime": 8.391910178994294,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 7260000,
        "reward_mean": -0.05977499999999958,
        "reward_max": 0.9262500000000005,
        "reward_min": -1.0856249999999992,
        "leartime_s": 0.025896200007991865,
        "sampletime": 8.347143925988348,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 7280000,
        "reward_mean": -0.28134999999999943,
        "reward_max": 0.6343750000000004,
        "reward_min": -1.5181249999999997,
        "leartime_s": 0.019546022987924516,
        "sampletime": 8.375279847008642,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 7300000,
        "reward_mean": -0.12199999999999968,
        "reward_max": 0.8250000000000003,
        "reward_min": -1.2756249999999991,
        "leartime_s": 0.025808529986534268,
        "sampletime": 8.417746427992824,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 7320000,
        "reward_mean": -0.3065499999999996,
        "reward_max": 0.7356250000000006,
        "reward_min": -1.7399999999999987,
        "leartime_s": 0.042544121999526396,
        "sampletime": 8.321829207998235,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 7340000,
        "reward_mean": -0.06447499999999952,
        "reward_max": 0.7943750000000008,
        "reward_min": -1.3587499999999986,
        "leartime_s": 0.018486701999790967,
        "sampletime": 8.196007061982527,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 7360000,
        "reward_mean": -0.10422499999999954,
        "reward_max": 0.9225000000000008,
        "reward_min": -1.13,
        "leartime_s": 0.025189554988173768,
        "sampletime": 8.357195000018692,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 7380000,
        "reward_mean": -0.5548749999999993,
        "reward_max": 0.7743750000000006,
        "reward_min": -1.875624999999999,
        "leartime_s": 0.01880789900314994,
        "sampletime": 8.3253461199929,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 7400000,
        "reward_mean": -0.3693749999999995,
        "reward_max": 0.398750000000001,
        "reward_min": -1.5118749999999976,
        "leartime_s": 0.03249404902453534,
        "sampletime": 8.277669098984916,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 7420000,
        "reward_mean": -0.4852499999999997,
        "reward_max": 0.3375000000000008,
        "reward_min": -1.8006250000000001,
        "leartime_s": 0.02134296699659899,
        "sampletime": 8.157093479996547,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 7440000,
        "reward_mean": -0.31394999999999973,
        "reward_max": 0.5556250000000006,
        "reward_min": -1.57375,
        "leartime_s": 0.023994735995074734,
        "sampletime": 8.277160961995833,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 7460000,
        "reward_mean": -0.4071249999999997,
        "reward_max": 0.4712500000000004,
        "reward_min": -1.2518750000000005,
        "leartime_s": 0.01888285597669892,
        "sampletime": 8.467068275000202,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 7480000,
        "reward_mean": -0.32537499999999964,
        "reward_max": 0.6787500000000004,
        "reward_min": -1.3174999999999994,
        "leartime_s": 0.024004935985431075,
        "sampletime": 8.403150589991128,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 7500000,
        "reward_mean": -0.4877499999999997,
        "reward_max": 0.3587500000000009,
        "reward_min": -1.2587499999999987,
        "leartime_s": 0.021352053008740768,
        "sampletime": 8.435934879002161,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 7520000,
        "reward_mean": -0.15862499999999954,
        "reward_max": 0.7725000000000007,
        "reward_min": -1.0618749999999995,
        "leartime_s": 0.017998467985307798,
        "sampletime": 8.536622623010771,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 7540000,
        "reward_mean": -0.3916249999999997,
        "reward_max": 0.5125000000000004,
        "reward_min": -1.2437500000000004,
        "leartime_s": 0.020096583000849932,
        "sampletime": 8.38635085101123,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 7560000,
        "reward_mean": -0.5221749999999997,
        "reward_max": 0.16562500000000044,
        "reward_min": -1.5368749999999987,
        "leartime_s": 0.045520707994000986,
        "sampletime": 8.225275809003506,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 7580000,
        "reward_mean": -0.3998249999999996,
        "reward_max": 0.6387500000000006,
        "reward_min": -1.6118749999999995,
        "leartime_s": 0.01937934898887761,
        "sampletime": 8.379928878013743,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 7600000,
        "reward_mean": -0.33784999999999976,
        "reward_max": 0.3131250000000003,
        "reward_min": -1.2650000000000001,
        "leartime_s": 0.028215781989274547,
        "sampletime": 8.48591227500583,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 7620000,
        "reward_mean": -0.4690749999999996,
        "reward_max": 0.2575000000000004,
        "reward_min": -1.500624999999999,
        "leartime_s": 0.029999955993844196,
        "sampletime": 8.526540489983745,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 7640000,
        "reward_mean": -0.5234249999999997,
        "reward_max": 0.40125000000000033,
        "reward_min": -1.48375,
        "leartime_s": 0.026124566997168586,
        "sampletime": 8.286338140984299,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 7660000,
        "reward_mean": -0.6817499999999996,
        "reward_max": 0.8568749999999998,
        "reward_min": -2.3506249999999986,
        "leartime_s": 0.05299374900641851,
        "sampletime": 8.292426419997355,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 7680000,
        "reward_mean": -0.5396249999999998,
        "reward_max": 0.19062500000000013,
        "reward_min": -2.0056249999999993,
        "leartime_s": 0.03463261999422684,
        "sampletime": 8.459774618007941,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 7700000,
        "reward_mean": -0.7637249999999997,
        "reward_max": 0.32437499999999975,
        "reward_min": -1.8793750000000007,
        "leartime_s": 0.028004842024529353,
        "sampletime": 8.32670470199082,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 7720000,
        "reward_mean": -0.3830999999999998,
        "reward_max": 0.2825000000000001,
        "reward_min": -1.55375,
        "leartime_s": 0.019751829997403547,
        "sampletime": 8.291947135003284,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 7740000,
        "reward_mean": -0.37162499999999976,
        "reward_max": 0.6087500000000002,
        "reward_min": -1.1831249999999993,
        "leartime_s": 0.028741185000399128,
        "sampletime": 8.316521172993816,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 7760000,
        "reward_mean": -0.5790499999999997,
        "reward_max": 0.3012500000000002,
        "reward_min": -2.1193749999999993,
        "leartime_s": 0.01974542997777462,
        "sampletime": 8.38985532897641,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 7780000,
        "reward_mean": -0.5096999999999996,
        "reward_max": 0.47375000000000017,
        "reward_min": -1.8868749999999992,
        "leartime_s": 0.021703744016122073,
        "sampletime": 8.356668978987727,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 7800000,
        "reward_mean": -0.6053749999999997,
        "reward_max": 0.3206250000000004,
        "reward_min": -1.916249999999999,
        "leartime_s": 0.034136915986891836,
        "sampletime": 8.486719740991248,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 7820000,
        "reward_mean": -0.8916249999999996,
        "reward_max": 0.17437500000000036,
        "reward_min": -3.113749999999998,
        "leartime_s": 0.03541402198607102,
        "sampletime": 8.39356719100033,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 7840000,
        "reward_mean": -0.5732999999999997,
        "reward_max": 0.2243750000000003,
        "reward_min": -1.6431249999999993,
        "leartime_s": 0.021117960015544668,
        "sampletime": 8.289500970975496,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 7860000,
        "reward_mean": -0.3016999999999998,
        "reward_max": 1.14375,
        "reward_min": -1.0643750000000007,
        "leartime_s": 0.02051476700580679,
        "sampletime": 8.118371432996355,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 7880000,
        "reward_mean": -0.30152499999999965,
        "reward_max": 0.6137500000000004,
        "reward_min": -1.5474999999999997,
        "leartime_s": 0.04368974099634215,
        "sampletime": 8.222148398985155,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 7900000,
        "reward_mean": -0.7743999999999996,
        "reward_max": -0.0281249999999999,
        "reward_min": -1.8556249999999996,
        "leartime_s": 0.020225741987815127,
        "sampletime": 8.401038185984362,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 7920000,
        "reward_mean": -0.5712249999999996,
        "reward_max": 0.2393750000000004,
        "reward_min": -1.55,
        "leartime_s": 0.03296338199288584,
        "sampletime": 8.359384298993973,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 7940000,
        "reward_mean": -0.44079999999999986,
        "reward_max": 0.41687500000000066,
        "reward_min": -1.6737499999999996,
        "leartime_s": 0.04812601101002656,
        "sampletime": 8.449976656993385,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 7960000,
        "reward_mean": -0.5890249999999999,
        "reward_max": 0.8475000000000004,
        "reward_min": -2.2274999999999996,
        "leartime_s": 0.022627780999755487,
        "sampletime": 8.359436124999775,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 7980000,
        "reward_mean": -0.5403249999999999,
        "reward_max": 0.31750000000000034,
        "reward_min": -1.4606249999999994,
        "leartime_s": 0.022301849006908014,
        "sampletime": 8.328289400989888,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 8000000,
        "reward_mean": -0.6424999999999997,
        "reward_max": 0.05500000000000019,
        "reward_min": -1.5762499999999984,
        "leartime_s": 0.020171819982351735,
        "sampletime": 8.407460735004861,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 8020000,
        "reward_mean": -0.4957249999999997,
        "reward_max": 0.42937500000000056,
        "reward_min": -4.445624999999997,
        "leartime_s": 0.02050677200895734,
        "sampletime": 8.361677822016645,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 8040000,
        "reward_mean": -0.4697499999999997,
        "reward_max": 0.24312500000000023,
        "reward_min": -1.6543749999999986,
        "leartime_s": 0.024799155013170093,
        "sampletime": 8.322401331999572,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 8060000,
        "reward_mean": -0.6902999999999998,
        "reward_max": 0.11125000000000031,
        "reward_min": -1.765,
        "leartime_s": 0.03165726299630478,
        "sampletime": 8.3595208870247,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 8080000,
        "reward_mean": -0.7122249999999996,
        "reward_max": 0.46437500000000004,
        "reward_min": -2.516249999999999,
        "leartime_s": 0.01995483200880699,
        "sampletime": 8.164943234005477,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 8100000,
        "reward_mean": -0.7505749999999999,
        "reward_max": -0.013124999999999942,
        "reward_min": -2.0156249999999996,
        "leartime_s": 0.020329695020336658,
        "sampletime": 8.459767587977694,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 8120000,
        "reward_mean": -0.41117499999999985,
        "reward_max": 0.4475000000000001,
        "reward_min": -1.5374999999999992,
        "leartime_s": 0.044084011984523386,
        "sampletime": 8.321212954993825,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 8140000,
        "reward_mean": -0.44057499999999983,
        "reward_max": 0.3656250000000003,
        "reward_min": -2.176874999999999,
        "leartime_s": 0.04663411001092754,
        "sampletime": 8.535044916003244,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 8160000,
        "reward_mean": -0.3991249999999998,
        "reward_max": 0.8556250000000005,
        "reward_min": -1.6087500000000001,
        "leartime_s": 0.05407356200157665,
        "sampletime": 8.320132845983608,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 8180000,
        "reward_mean": -0.6484999999999997,
        "reward_max": 0.5187500000000002,
        "reward_min": -2.2899999999999987,
        "leartime_s": 0.04527182099991478,
        "sampletime": 8.381076010002289,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 8200000,
        "reward_mean": -0.7078999999999998,
        "reward_max": 0.07062500000000052,
        "reward_min": -2.0599999999999987,
        "leartime_s": 0.039007063023746014,
        "sampletime": 8.334968481998658,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 8220000,
        "reward_mean": -1.0262999999999998,
        "reward_max": -0.012499999999999834,
        "reward_min": -2.426249999999999,
        "leartime_s": 0.023679826990701258,
        "sampletime": 8.38273110598675,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 8240000,
        "reward_mean": -0.4799249999999997,
        "reward_max": 0.5068750000000005,
        "reward_min": -1.4674999999999998,
        "leartime_s": 0.02174408099381253,
        "sampletime": 8.361422893998679,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 8260000,
        "reward_mean": -0.5124999999999997,
        "reward_max": 0.3331250000000002,
        "reward_min": -1.2743749999999991,
        "leartime_s": 0.0219697639986407,
        "sampletime": 8.656217088981066,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 8280000,
        "reward_mean": -0.2595749999999998,
        "reward_max": 0.9218750000000003,
        "reward_min": -1.7981249999999998,
        "leartime_s": 0.024374750995775685,
        "sampletime": 8.420907225983683,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 8300000,
        "reward_mean": -0.6000499999999998,
        "reward_max": 0.2787500000000002,
        "reward_min": -1.9524999999999988,
        "leartime_s": 0.0220039619889576,
        "sampletime": 8.338137563987402,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 8320000,
        "reward_mean": -0.24067499999999975,
        "reward_max": 0.7812500000000003,
        "reward_min": -1.7599999999999998,
        "leartime_s": 0.020457211998291314,
        "sampletime": 8.495269693987211,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 8340000,
        "reward_mean": -0.9206499999999997,
        "reward_max": 0.007499999999999937,
        "reward_min": -2.8687499999999995,
        "leartime_s": 0.022895461006555706,
        "sampletime": 8.204677153989905,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 8360000,
        "reward_mean": -0.48417499999999963,
        "reward_max": 0.2918750000000001,
        "reward_min": -1.5131249999999992,
        "leartime_s": 0.037655985011952,
        "sampletime": 8.263375656999415,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 8380000,
        "reward_mean": -0.6840249999999999,
        "reward_max": 0.26500000000000035,
        "reward_min": -2.076875,
        "leartime_s": 0.025096427998505533,
        "sampletime": 8.283341078989906,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 8400000,
        "reward_mean": -0.3966249999999997,
        "reward_max": 0.43875000000000025,
        "reward_min": -1.2962499999999986,
        "leartime_s": 0.03286597898113541,
        "sampletime": 8.548202925012447,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 8420000,
        "reward_mean": -0.4288499999999998,
        "reward_max": 0.2993750000000004,
        "reward_min": -1.2087500000000002,
        "leartime_s": 0.041756079997867346,
        "sampletime": 8.490931214997545,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 8440000,
        "reward_mean": -0.6380999999999997,
        "reward_max": 0.21625000000000028,
        "reward_min": -2.218749999999999,
        "leartime_s": 0.023048618983011693,
        "sampletime": 8.341776292974828,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 8460000,
        "reward_mean": -0.5685999999999994,
        "reward_max": 0.3975000000000004,
        "reward_min": -2.619999999999998,
        "leartime_s": 0.028749132005032152,
        "sampletime": 8.268068560020765,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 8480000,
        "reward_mean": -0.5311249999999997,
        "reward_max": 0.24375000000000027,
        "reward_min": -1.564375,
        "leartime_s": 0.0211421660205815,
        "sampletime": 8.365084909979487,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 8500000,
        "reward_mean": -0.43787499999999996,
        "reward_max": 0.5587500000000004,
        "reward_min": -1.2600000000000005,
        "leartime_s": 0.021956163982395083,
        "sampletime": 8.430342299019685,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 8520000,
        "reward_mean": -0.3455749999999997,
        "reward_max": 0.43312500000000054,
        "reward_min": -1.2431249999999994,
        "leartime_s": 0.02715283998986706,
        "sampletime": 8.466960449994076,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 8540000,
        "reward_mean": -0.6222499999999997,
        "reward_max": 0.35437500000000016,
        "reward_min": -2.048749999999999,
        "leartime_s": 0.021676280011888593,
        "sampletime": 8.377570907003246,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 8560000,
        "reward_mean": -0.4460999999999998,
        "reward_max": 0.5037500000000003,
        "reward_min": -1.1662499999999987,
        "leartime_s": 0.02285827900050208,
        "sampletime": 8.458621399011463,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 8580000,
        "reward_mean": -0.48537499999999967,
        "reward_max": 0.7612500000000005,
        "reward_min": -2.0074999999999994,
        "leartime_s": 0.02615106399753131,
        "sampletime": 8.49655994499335,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 8600000,
        "reward_mean": -0.20507499999999956,
        "reward_max": 0.6456250000000004,
        "reward_min": -1.296874999999999,
        "leartime_s": 0.02842391698504798,
        "sampletime": 8.342052777006757,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 8620000,
        "reward_mean": -0.6671999999999997,
        "reward_max": 0.14312500000000014,
        "reward_min": -1.57125,
        "leartime_s": 0.045911191002232954,
        "sampletime": 8.211466160981217,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 8640000,
        "reward_mean": -0.2770749999999997,
        "reward_max": 0.5368750000000005,
        "reward_min": -1.2468750000000002,
        "leartime_s": 0.04579530097544193,
        "sampletime": 8.31212570797652,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 8660000,
        "reward_mean": -0.5894999999999996,
        "reward_max": 0.30562500000000054,
        "reward_min": -1.922499999999999,
        "leartime_s": 0.01982367699383758,
        "sampletime": 8.390931058005663,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 8680000,
        "reward_mean": -0.9265999999999995,
        "reward_max": 0.3887500000000003,
        "reward_min": -2.52,
        "leartime_s": 0.028407347010215744,
        "sampletime": 8.354081313009374,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 8700000,
        "reward_mean": -0.34637499999999966,
        "reward_max": 0.7643750000000006,
        "reward_min": -1.7243749999999982,
        "leartime_s": 0.04750893198070116,
        "sampletime": 8.359154376987135,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 8720000,
        "reward_mean": -0.06139999999999954,
        "reward_max": 0.6387500000000007,
        "reward_min": -1.02875,
        "leartime_s": 0.023845899006118998,
        "sampletime": 8.439937346003717,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 8740000,
        "reward_mean": -0.05894999999999969,
        "reward_max": 0.9975000000000002,
        "reward_min": -1.1843750000000002,
        "leartime_s": 0.04525530300452374,
        "sampletime": 8.437769838987151,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 8760000,
        "reward_mean": -0.19834999999999955,
        "reward_max": 0.5087500000000004,
        "reward_min": -1.00375,
        "leartime_s": 0.028249419992789626,
        "sampletime": 8.434899696992943,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 8780000,
        "reward_mean": -0.1176999999999997,
        "reward_max": 1.0106250000000006,
        "reward_min": -1.0037500000000001,
        "leartime_s": 0.0476061090012081,
        "sampletime": 8.458101049996912,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 8800000,
        "reward_mean": -0.38287499999999963,
        "reward_max": 0.4925000000000004,
        "reward_min": -1.7493749999999986,
        "leartime_s": 0.021773979999125004,
        "sampletime": 8.513205957977334,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 8820000,
        "reward_mean": -0.39332499999999954,
        "reward_max": 0.40937500000000104,
        "reward_min": -2.084374999999998,
        "leartime_s": 0.02187752097961493,
        "sampletime": 8.323206970992032,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 8840000,
        "reward_mean": -0.4215249999999995,
        "reward_max": 0.5562500000000005,
        "reward_min": -2.4837499999999992,
        "leartime_s": 0.03862139699049294,
        "sampletime": 8.587307029985823,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 8860000,
        "reward_mean": -0.5828749999999996,
        "reward_max": 0.2700000000000002,
        "reward_min": -1.7699999999999998,
        "leartime_s": 0.024259081023046747,
        "sampletime": 8.455498224007897,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 8880000,
        "reward_mean": -0.39507499999999957,
        "reward_max": 0.6156250000000005,
        "reward_min": -1.6462499999999993,
        "leartime_s": 0.02181460100109689,
        "sampletime": 8.145821294019697,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 8900000,
        "reward_mean": -0.5334249999999995,
        "reward_max": 0.46312500000000034,
        "reward_min": -1.6681249999999992,
        "leartime_s": 0.03615613002330065,
        "sampletime": 8.469797247002134,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 8920000,
        "reward_mean": -0.0703249999999997,
        "reward_max": 0.7106250000000004,
        "reward_min": -1.0231249999999996,
        "leartime_s": 0.029026580014033243,
        "sampletime": 8.29979980099597,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 8940000,
        "reward_mean": -0.18442499999999973,
        "reward_max": 0.6412500000000002,
        "reward_min": -1.1243749999999992,
        "leartime_s": 0.02176110100117512,
        "sampletime": 8.366475754010025,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 8960000,
        "reward_mean": 0.01817500000000034,
        "reward_max": 1.1987500000000002,
        "reward_min": -0.9331249999999994,
        "leartime_s": 0.04861813600291498,
        "sampletime": 8.16782415099442,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 8980000,
        "reward_mean": -0.39879999999999954,
        "reward_max": 0.5881250000000007,
        "reward_min": -1.7399999999999987,
        "leartime_s": 0.04039337899303064,
        "sampletime": 8.20408714399673,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 9000000,
        "reward_mean": 0.20467500000000044,
        "reward_max": 1.0525000000000004,
        "reward_min": -0.7456249999999995,
        "leartime_s": 0.04627822898328304,
        "sampletime": 8.334894844010705,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 9020000,
        "reward_mean": -0.32912499999999956,
        "reward_max": 0.42625000000000024,
        "reward_min": -1.281249999999999,
        "leartime_s": 0.026383151998743415,
        "sampletime": 8.492652494023787,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 9040000,
        "reward_mean": 0.08502500000000042,
        "reward_max": 0.8525000000000005,
        "reward_min": -1.0593750000000002,
        "leartime_s": 0.022491976007586345,
        "sampletime": 8.460113172011916,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 9060000,
        "reward_mean": -0.11799999999999965,
        "reward_max": 0.6631250000000002,
        "reward_min": -1.2681249999999995,
        "leartime_s": 0.026128730998607352,
        "sampletime": 8.324621059000492,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 9080000,
        "reward_mean": -0.03197499999999959,
        "reward_max": 0.9425000000000007,
        "reward_min": -0.8981249999999996,
        "leartime_s": 0.022497136000311002,
        "sampletime": 8.477587281988235,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 9100000,
        "reward_mean": -0.2409999999999997,
        "reward_max": 0.48625000000000035,
        "reward_min": -1.4181250000000003,
        "leartime_s": 0.02247316497960128,
        "sampletime": 8.375697226991178,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 9120000,
        "reward_mean": -0.20657499999999962,
        "reward_max": 0.5806250000000006,
        "reward_min": -0.9431249999999993,
        "leartime_s": 0.034424618002958596,
        "sampletime": 8.380323024990503,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 9140000,
        "reward_mean": -0.2021499999999994,
        "reward_max": 0.6637500000000006,
        "reward_min": -1.7406249999999999,
        "leartime_s": 0.03194883099058643,
        "sampletime": 8.377123655984178,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 9160000,
        "reward_mean": -0.3693249999999997,
        "reward_max": 0.9400000000000004,
        "reward_min": -1.3218749999999997,
        "leartime_s": 0.027580469992244616,
        "sampletime": 8.232987847994082,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 9180000,
        "reward_mean": 0.016050000000000276,
        "reward_max": 0.8050000000000005,
        "reward_min": -1.01625,
        "leartime_s": 0.024364618002437055,
        "sampletime": 8.352800636988832,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 9200000,
        "reward_mean": -0.018499999999999586,
        "reward_max": 1.0193750000000004,
        "reward_min": -0.8637499999999994,
        "leartime_s": 0.02261411599465646,
        "sampletime": 8.410423221997917,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 9220000,
        "reward_mean": 0.10680000000000038,
        "reward_max": 0.9406250000000006,
        "reward_min": -0.8749999999999993,
        "leartime_s": 0.04474777900031768,
        "sampletime": 8.266224752995186,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 9240000,
        "reward_mean": -0.01934999999999971,
        "reward_max": 0.8918750000000002,
        "reward_min": -1.1868749999999992,
        "leartime_s": 0.014776581985643134,
        "sampletime": 8.30147865897743,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 9260000,
        "reward_mean": -0.12857499999999955,
        "reward_max": 1.0950000000000006,
        "reward_min": -1.1599999999999995,
        "leartime_s": 0.027841971983434632,
        "sampletime": 8.359229808993405,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 9280000,
        "reward_mean": 0.005750000000000535,
        "reward_max": 1.071250000000001,
        "reward_min": -0.7462499999999994,
        "leartime_s": 0.026193739991867915,
        "sampletime": 8.50741544997436,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 9300000,
        "reward_mean": -0.007224999999999448,
        "reward_max": 1.19375,
        "reward_min": -0.9899999999999995,
        "leartime_s": 0.04357644100673497,
        "sampletime": 8.274677734007128,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 9320000,
        "reward_mean": -0.1351749999999995,
        "reward_max": 0.6918750000000005,
        "reward_min": -1.1943750000000006,
        "leartime_s": 0.03036394898663275,
        "sampletime": 8.478602307004621,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 9340000,
        "reward_mean": -0.0037499999999995853,
        "reward_max": 0.8731250000000004,
        "reward_min": -1.4956249999999989,
        "leartime_s": 0.024102994007989764,
        "sampletime": 8.387054708000505,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 9360000,
        "reward_mean": -0.09379999999999955,
        "reward_max": 0.7225000000000004,
        "reward_min": -0.8462499999999993,
        "leartime_s": 0.023152780020609498,
        "sampletime": 8.240530684997793,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 9380000,
        "reward_mean": 0.1250250000000004,
        "reward_max": 0.9450000000000006,
        "reward_min": -1.1362499999999998,
        "leartime_s": 0.02447470900369808,
        "sampletime": 8.089596264006104,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 9400000,
        "reward_mean": 0.1443250000000005,
        "reward_max": 1.5568750000000005,
        "reward_min": -1.0387499999999994,
        "leartime_s": 0.024824571009958163,
        "sampletime": 8.42172141498304,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 9420000,
        "reward_mean": -0.16384999999999966,
        "reward_max": 0.6125000000000005,
        "reward_min": -1.14875,
        "leartime_s": 0.02275397299672477,
        "sampletime": 8.393950992001919,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 9440000,
        "reward_mean": 0.1244000000000004,
        "reward_max": 1.1606250000000002,
        "reward_min": -0.7056249999999988,
        "leartime_s": 0.024325385980773717,
        "sampletime": 8.52502763600205,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 9460000,
        "reward_mean": -0.017399999999999388,
        "reward_max": 0.9306250000000007,
        "reward_min": -1.03375,
        "leartime_s": 0.023134649003623053,
        "sampletime": 8.496315380994929,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 9480000,
        "reward_mean": 0.028625000000000518,
        "reward_max": 0.9556250000000003,
        "reward_min": -0.8950000000000001,
        "leartime_s": 0.023406997992424294,
        "sampletime": 8.32396763502038,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 9500000,
        "reward_mean": -0.31942499999999957,
        "reward_max": 0.5393750000000004,
        "reward_min": -1.360625,
        "leartime_s": 0.02295926000806503,
        "sampletime": 8.478026411990868,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 9520000,
        "reward_mean": -0.16264999999999963,
        "reward_max": 0.7568750000000009,
        "reward_min": -1.2099999999999982,
        "leartime_s": 0.027654305013129488,
        "sampletime": 8.465171247022226,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 9540000,
        "reward_mean": -0.02947499999999953,
        "reward_max": 1.1731250000000002,
        "reward_min": -1.1118749999999993,
        "leartime_s": 0.023739468975691125,
        "sampletime": 8.427578508999432,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 9560000,
        "reward_mean": 0.18112500000000048,
        "reward_max": 1.1337500000000005,
        "reward_min": -0.6481250000000001,
        "leartime_s": 0.029937794985016808,
        "sampletime": 8.536303261993453,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 9580000,
        "reward_mean": 0.0833000000000005,
        "reward_max": 0.9981250000000005,
        "reward_min": -0.749374999999999,
        "leartime_s": 0.05100024299463257,
        "sampletime": 8.62536846200237,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 9600000,
        "reward_mean": 0.24155000000000043,
        "reward_max": 1.2143750000000006,
        "reward_min": -0.8781249999999996,
        "leartime_s": 0.04522642999654636,
        "sampletime": 8.215976919978857,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 9620000,
        "reward_mean": 0.14012500000000044,
        "reward_max": 1.0118750000000005,
        "reward_min": -0.6631249999999995,
        "leartime_s": 0.05196321298717521,
        "sampletime": 8.435221131017897,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 9640000,
        "reward_mean": 0.13632500000000053,
        "reward_max": 1.1612500000000008,
        "reward_min": -0.8612499999999997,
        "leartime_s": 0.04736701099318452,
        "sampletime": 8.44531663399539,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 9660000,
        "reward_mean": -0.03592499999999955,
        "reward_max": 0.8418750000000007,
        "reward_min": -0.9799999999999995,
        "leartime_s": 0.03953791700769216,
        "sampletime": 8.414972708007554,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 9680000,
        "reward_mean": -0.02862499999999942,
        "reward_max": 0.7937500000000003,
        "reward_min": -1.0687499999999992,
        "leartime_s": 0.04098677201545797,
        "sampletime": 8.21762270500767,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 9700000,
        "reward_mean": 0.17372500000000046,
        "reward_max": 1.2043750000000004,
        "reward_min": -0.6831249999999998,
        "leartime_s": 0.06142402297700755,
        "sampletime": 8.369688862003386,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 9720000,
        "reward_mean": -0.1951499999999994,
        "reward_max": 0.8043750000000008,
        "reward_min": -1.515624999999999,
        "leartime_s": 0.024669411999639124,
        "sampletime": 8.380324842990376,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 9740000,
        "reward_mean": -0.04339999999999944,
        "reward_max": 0.8900000000000007,
        "reward_min": -1.733749999999999,
        "leartime_s": 0.04410442599328235,
        "sampletime": 8.34282273799181,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 9760000,
        "reward_mean": 0.1339750000000005,
        "reward_max": 1.1537500000000007,
        "reward_min": -1.150625,
        "leartime_s": 0.02323450898984447,
        "sampletime": 8.241041250003036,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 9780000,
        "reward_mean": 0.055575000000000575,
        "reward_max": 0.8637500000000009,
        "reward_min": -1.2268749999999997,
        "leartime_s": 0.024118754983646795,
        "sampletime": 8.722524650976993,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 9800000,
        "reward_mean": 0.1738250000000005,
        "reward_max": 0.9537500000000004,
        "reward_min": -0.5037499999999996,
        "leartime_s": 0.03432487600366585,
        "sampletime": 8.330790602980414,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 9820000,
        "reward_mean": 0.1729500000000005,
        "reward_max": 1.0331250000000005,
        "reward_min": -0.8462499999999991,
        "leartime_s": 0.035288577986648306,
        "sampletime": 8.132863545004511,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 9840000,
        "reward_mean": 0.20417500000000052,
        "reward_max": 1.3231250000000006,
        "reward_min": -0.6112499999999995,
        "leartime_s": 0.023830915975850075,
        "sampletime": 7.733210115984548,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 9860000,
        "reward_mean": 0.07612500000000051,
        "reward_max": 1.0475000000000008,
        "reward_min": -0.7543749999999996,
        "leartime_s": 0.04853211698355153,
        "sampletime": 7.624590007006191,
        "best_mean": 0.27607500000000046,
        "best_max": 1.2581250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 9880000,
        "reward_mean": 0.3524500000000006,
        "reward_max": 1.2437500000000008,
        "reward_min": -0.41312499999999935,
        "leartime_s": 0.04010954202385619,
        "sampletime": 7.710027205990627,
        "best_mean": 0.3524500000000006,
        "best_max": 1.2437500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 9900000,
        "reward_mean": 0.25357500000000055,
        "reward_max": 1.0150000000000006,
        "reward_min": -0.5574999999999989,
        "leartime_s": 0.038798958994448185,
        "sampletime": 7.860119705001125,
        "best_mean": 0.3524500000000006,
        "best_max": 1.2437500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 9920000,
        "reward_mean": -0.13364999999999944,
        "reward_max": 0.6325000000000006,
        "reward_min": -1.4637499999999988,
        "leartime_s": 0.02711043501039967,
        "sampletime": 7.7495157240191475,
        "best_mean": 0.3524500000000006,
        "best_max": 1.2437500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 9940000,
        "reward_mean": 0.3026250000000007,
        "reward_max": 1.1050000000000006,
        "reward_min": -1.0306249999999992,
        "leartime_s": 0.023004897986538708,
        "sampletime": 7.6127094110124744,
        "best_mean": 0.3524500000000006,
        "best_max": 1.2437500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 9960000,
        "reward_mean": 0.2793750000000006,
        "reward_max": 1.1675000000000006,
        "reward_min": -0.8499999999999996,
        "leartime_s": 0.036075252981390804,
        "sampletime": 7.722328498988645,
        "best_mean": 0.3524500000000006,
        "best_max": 1.2437500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 9980000,
        "reward_mean": 0.44652500000000067,
        "reward_max": 1.2337500000000008,
        "reward_min": -0.6062499999999991,
        "leartime_s": 0.029524982994189486,
        "sampletime": 7.662214056996163,
        "best_mean": 0.44652500000000067,
        "best_max": 1.2337500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 10000000,
        "reward_mean": -0.023474999999999475,
        "reward_max": 0.8593750000000007,
        "reward_min": -1.4106249999999991,
        "leartime_s": 0.02828195400070399,
        "sampletime": 7.765591306000715,
        "best_mean": 0.44652500000000067,
        "best_max": 1.2337500000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 1511,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]