[
    {
        "generation": 1,
        "timesteps": 20000,
        "reward_mean": -39.66847476190476,
        "reward_max": -3.585,
        "reward_min": -69.51066666666665,
        "leartime_s": 0.019060719991102815,
        "sampletime": 7.801474367006449,
        "best_mean": -39.66847476190476,
        "best_max": -3.585,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 40000,
        "reward_mean": -38.89563133333334,
        "reward_max": -3.2843749999999994,
        "reward_min": -81.36375000000001,
        "leartime_s": 0.013518571009626612,
        "sampletime": 7.8820308259746525,
        "best_mean": -38.89563133333334,
        "best_max": -3.2843749999999994,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 60000,
        "reward_mean": -21.9307,
        "reward_max": 1.3031250000000008,
        "reward_min": -165.986875,
        "leartime_s": 0.004592013021465391,
        "sampletime": 7.691291942988755,
        "best_mean": -21.9307,
        "best_max": 1.3031250000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 80000,
        "reward_mean": -18.186600000000002,
        "reward_max": 1.3106250000000013,
        "reward_min": -44.46000000000001,
        "leartime_s": 0.005411602003732696,
        "sampletime": 7.823055582004599,
        "best_mean": -18.186600000000002,
        "best_max": 1.3106250000000013,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 100000,
        "reward_mean": -20.0285,
        "reward_max": 0.18187500000000087,
        "reward_min": -122.04937499999998,
        "leartime_s": 0.014984074019594118,
        "sampletime": 7.706312252004864,
        "best_mean": -18.186600000000002,
        "best_max": 1.3106250000000013,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 120000,
        "reward_mean": -12.250900000000001,
        "reward_max": -1.1631249999999997,
        "reward_min": -116.46124999999999,
        "leartime_s": 0.004428287997143343,
        "sampletime": 7.819833891000599,
        "best_mean": -12.250900000000001,
        "best_max": -1.1631249999999997,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 140000,
        "reward_mean": -8.047375,
        "reward_max": -0.27749999999999975,
        "reward_min": -94.58874999999999,
        "leartime_s": 0.004584647016599774,
        "sampletime": 7.791818275989499,
        "best_mean": -8.047375,
        "best_max": -0.27749999999999975,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 160000,
        "reward_mean": -4.079899999999999,
        "reward_max": 0.11625000000000028,
        "reward_min": -19.001250000000002,
        "leartime_s": 0.00446847899002023,
        "sampletime": 7.795415546017466,
        "best_mean": -4.079899999999999,
        "best_max": 0.11625000000000028,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 180000,
        "reward_mean": -1.0654999999999997,
        "reward_max": 0.9831250000000004,
        "reward_min": -7.5575000000000045,
        "leartime_s": 0.00467659899732098,
        "sampletime": 7.720395395997912,
        "best_mean": -1.0654999999999997,
        "best_max": 0.9831250000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 200000,
        "reward_mean": -0.33224999999999943,
        "reward_max": 0.7468750000000006,
        "reward_min": -2.7806249999999997,
        "leartime_s": 0.013559187995269895,
        "sampletime": 7.7944755050120875,
        "best_mean": -0.33224999999999943,
        "best_max": 0.7468750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 220000,
        "reward_mean": 0.016625000000000605,
        "reward_max": 0.9656250000000007,
        "reward_min": -2.9693750000000003,
        "leartime_s": 0.004617009020876139,
        "sampletime": 7.7219575229974,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 240000,
        "reward_mean": -0.20822499999999947,
        "reward_max": 0.5381250000000006,
        "reward_min": -2.4487499999999995,
        "leartime_s": 0.004653271986171603,
        "sampletime": 7.740361731994199,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 260000,
        "reward_mean": -0.25264999999999976,
        "reward_max": 0.7925000000000002,
        "reward_min": -1.2450000000000003,
        "leartime_s": 0.00473481000517495,
        "sampletime": 7.791946112993173,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 280000,
        "reward_mean": -0.6250999999999999,
        "reward_max": 0.3225000000000002,
        "reward_min": -2.4281249999999996,
        "leartime_s": 0.004978359997039661,
        "sampletime": 7.801249515003292,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 300000,
        "reward_mean": -0.69505,
        "reward_max": 0.2268750000000003,
        "reward_min": -1.6293749999999987,
        "leartime_s": 0.004961109982104972,
        "sampletime": 7.927445995999733,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 320000,
        "reward_mean": -0.5108499999999998,
        "reward_max": 0.7868749999999998,
        "reward_min": -1.6243749999999988,
        "leartime_s": 0.01302824099548161,
        "sampletime": 7.748082232021261,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 340000,
        "reward_mean": -0.8039999999999998,
        "reward_max": -0.09812499999999975,
        "reward_min": -2.174999999999999,
        "leartime_s": 0.004095084004802629,
        "sampletime": 7.841259235981852,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 360000,
        "reward_mean": -0.8384749999999999,
        "reward_max": -0.014374999999999943,
        "reward_min": -1.991874999999999,
        "leartime_s": 0.00482277397532016,
        "sampletime": 7.803783517010743,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 380000,
        "reward_mean": -0.8775499999999999,
        "reward_max": -0.07812500000000004,
        "reward_min": -1.5793750000000002,
        "leartime_s": 0.004799952992470935,
        "sampletime": 7.854695813002763,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 400000,
        "reward_mean": -0.6376999999999998,
        "reward_max": 0.6343750000000004,
        "reward_min": -2.301874999999999,
        "leartime_s": 0.005182863998925313,
        "sampletime": 7.925526125007309,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 420000,
        "reward_mean": -0.9767249999999997,
        "reward_max": 0.0450000000000003,
        "reward_min": -2.364374999999999,
        "leartime_s": 0.0075364520016592,
        "sampletime": 7.768970932986122,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 440000,
        "reward_mean": -0.9853499999999997,
        "reward_max": -0.12687499999999985,
        "reward_min": -2.2774999999999985,
        "leartime_s": 0.0060488930030260235,
        "sampletime": 7.746091511013219,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 460000,
        "reward_mean": -1.1244249999999998,
        "reward_max": 0.034375000000000044,
        "reward_min": -2.479374999999999,
        "leartime_s": 0.005000856996048242,
        "sampletime": 7.812142120004864,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 480000,
        "reward_mean": -0.9029249999999998,
        "reward_max": -0.058124999999999594,
        "reward_min": -1.9968749999999988,
        "leartime_s": 0.005052945023635402,
        "sampletime": 7.804798094992293,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 500000,
        "reward_mean": -0.8420249999999997,
        "reward_max": 0.19812500000000025,
        "reward_min": -2.12,
        "leartime_s": 0.005076444998849183,
        "sampletime": 7.799855535005918,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 520000,
        "reward_mean": -1.0061249999999997,
        "reward_max": 0.15125000000000016,
        "reward_min": -3.0087499999999983,
        "leartime_s": 0.005243497987976298,
        "sampletime": 7.650980910984799,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 540000,
        "reward_mean": -0.7345999999999997,
        "reward_max": 0.10437500000000055,
        "reward_min": -1.8206249999999997,
        "leartime_s": 0.0051246589864604175,
        "sampletime": 7.751147404982476,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 560000,
        "reward_mean": -0.6669499999999997,
        "reward_max": 0.6118750000000003,
        "reward_min": -2.2093749999999996,
        "leartime_s": 0.014729498012457043,
        "sampletime": 7.766724054003134,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 580000,
        "reward_mean": -0.9206999999999999,
        "reward_max": 0.06000000000000063,
        "reward_min": -2.2381249999999997,
        "leartime_s": 0.01505170701420866,
        "sampletime": 7.899303459998919,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 600000,
        "reward_mean": -0.6741249999999996,
        "reward_max": 0.4762500000000003,
        "reward_min": -2.09625,
        "leartime_s": 0.005289778986480087,
        "sampletime": 7.713921404007124,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 620000,
        "reward_mean": -0.5343249999999995,
        "reward_max": 0.47625000000000073,
        "reward_min": -1.868749999999999,
        "leartime_s": 0.005386592005379498,
        "sampletime": 7.729784036026103,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 640000,
        "reward_mean": -1.0245999999999997,
        "reward_max": 0.23062500000000047,
        "reward_min": -2.5643749999999987,
        "leartime_s": 0.005366291996324435,
        "sampletime": 7.803853655990679,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 660000,
        "reward_mean": -0.6913249999999996,
        "reward_max": 0.6118750000000008,
        "reward_min": -2.447499999999999,
        "leartime_s": 0.005272462003631517,
        "sampletime": 7.686640874977456,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 680000,
        "reward_mean": -0.7575249999999998,
        "reward_max": 0.3100000000000003,
        "reward_min": -2.3225,
        "leartime_s": 0.06344721800996922,
        "sampletime": 7.793587894004304,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 700000,
        "reward_mean": -0.6666749999999996,
        "reward_max": 0.5550000000000007,
        "reward_min": -2.3499999999999983,
        "leartime_s": 0.005378392001148313,
        "sampletime": 7.7725270520022605,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 720000,
        "reward_mean": -0.4699999999999996,
        "reward_max": 0.3500000000000002,
        "reward_min": -1.7012499999999995,
        "leartime_s": 0.005612192006083205,
        "sampletime": 7.790960876998724,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 740000,
        "reward_mean": -0.5739749999999997,
        "reward_max": 0.33187500000000025,
        "reward_min": -2.011249999999999,
        "leartime_s": 0.005498720973264426,
        "sampletime": 7.843409024993889,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 760000,
        "reward_mean": -0.1292499999999996,
        "reward_max": 0.7693750000000007,
        "reward_min": -1.5424999999999989,
        "leartime_s": 0.005546611006138846,
        "sampletime": 7.6320229890116025,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 780000,
        "reward_mean": -0.26722499999999966,
        "reward_max": 1.0500000000000007,
        "reward_min": -1.8581249999999998,
        "leartime_s": 0.005547834007302299,
        "sampletime": 7.766586512007052,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 800000,
        "reward_mean": -0.15952499999999958,
        "reward_max": 0.7793750000000003,
        "reward_min": -1.8768749999999992,
        "leartime_s": 0.004700033023254946,
        "sampletime": 7.778973609005334,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 820000,
        "reward_mean": -0.1843999999999995,
        "reward_max": 0.7387500000000004,
        "reward_min": -1.7225000000000006,
        "leartime_s": 0.0057197049900423735,
        "sampletime": 7.854955685004825,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 840000,
        "reward_mean": -0.20664999999999956,
        "reward_max": 0.8506250000000007,
        "reward_min": -1.8393749999999982,
        "leartime_s": 0.005657954985508695,
        "sampletime": 7.7934640549938194,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 860000,
        "reward_mean": -0.2913749999999996,
        "reward_max": 0.5825000000000005,
        "reward_min": -1.322499999999999,
        "leartime_s": 0.005818687001010403,
        "sampletime": 7.798210955981631,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 880000,
        "reward_mean": -0.30834999999999957,
        "reward_max": 0.7375000000000004,
        "reward_min": -1.4593749999999994,
        "leartime_s": 0.006126437016064301,
        "sampletime": 7.628877782000927,
        "best_mean": 0.016625000000000605,
        "best_max": 0.9656250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 900000,
        "reward_mean": 0.0669500000000004,
        "reward_max": 1.0093750000000001,
        "reward_min": -1.1612499999999997,
        "leartime_s": 0.005942636984400451,
        "sampletime": 7.735895917983726,
        "best_mean": 0.0669500000000004,
        "best_max": 1.0093750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 920000,
        "reward_mean": -0.27349999999999963,
        "reward_max": 0.8856250000000006,
        "reward_min": -1.5037499999999995,
        "leartime_s": 0.009864252002444118,
        "sampletime": 7.833529655996244,
        "best_mean": 0.0669500000000004,
        "best_max": 1.0093750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 940000,
        "reward_mean": -0.16859999999999953,
        "reward_max": 0.8481250000000004,
        "reward_min": -1.3187499999999994,
        "leartime_s": 0.007317761017475277,
        "sampletime": 7.80468642100459,
        "best_mean": 0.0669500000000004,
        "best_max": 1.0093750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 960000,
        "reward_mean": -0.4420499999999995,
        "reward_max": 1.0843750000000005,
        "reward_min": -1.8356250000000003,
        "leartime_s": 0.009312515001511201,
        "sampletime": 7.824267161020543,
        "best_mean": 0.0669500000000004,
        "best_max": 1.0093750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 980000,
        "reward_mean": -0.31542499999999973,
        "reward_max": 0.5468750000000004,
        "reward_min": -1.5049999999999992,
        "leartime_s": 0.007177430990850553,
        "sampletime": 7.768232968985103,
        "best_mean": 0.0669500000000004,
        "best_max": 1.0093750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 1000000,
        "reward_mean": 0.1283500000000004,
        "reward_max": 1.3062500000000004,
        "reward_min": -1.6425000000000007,
        "leartime_s": 0.0058873269881587476,
        "sampletime": 7.7945797230058815,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 1020000,
        "reward_mean": 0.036400000000000515,
        "reward_max": 1.1093750000000004,
        "reward_min": -0.971874999999999,
        "leartime_s": 0.006184189987834543,
        "sampletime": 7.787430910975672,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 1040000,
        "reward_mean": -0.1508499999999995,
        "reward_max": 0.986250000000001,
        "reward_min": -1.5243749999999994,
        "leartime_s": 0.017527161980979145,
        "sampletime": 7.833754549006699,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 1060000,
        "reward_mean": -0.2748249999999996,
        "reward_max": 0.7050000000000006,
        "reward_min": -1.8618749999999995,
        "leartime_s": 0.006562503025634214,
        "sampletime": 7.771494442014955,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 1080000,
        "reward_mean": 0.043000000000000434,
        "reward_max": 1.1756250000000006,
        "reward_min": -1.0987499999999997,
        "leartime_s": 0.00975101999938488,
        "sampletime": 7.904543987009674,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 1100000,
        "reward_mean": -0.20582499999999945,
        "reward_max": 0.8100000000000007,
        "reward_min": -1.4393749999999996,
        "leartime_s": 0.007391824998194352,
        "sampletime": 7.775191212975187,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 1120000,
        "reward_mean": -0.2515249999999994,
        "reward_max": 1.0531250000000005,
        "reward_min": -1.6274999999999997,
        "leartime_s": 0.00942511999164708,
        "sampletime": 7.714959981007269,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 1140000,
        "reward_mean": -0.19978483333333297,
        "reward_max": 1.0025000000000006,
        "reward_min": -2.27,
        "leartime_s": 0.006401204009307548,
        "sampletime": 7.836697452003136,
        "best_mean": 0.1283500000000004,
        "best_max": 1.3062500000000004,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 1160000,
        "reward_mean": 0.22585000000000052,
        "reward_max": 1.6812500000000006,
        "reward_min": -0.8224999999999992,
        "leartime_s": 0.0064096139976754785,
        "sampletime": 7.634494046011241,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 1180000,
        "reward_mean": -0.2680249999999995,
        "reward_max": 0.8962500000000008,
        "reward_min": -1.8318750000000008,
        "leartime_s": 0.006721902987919748,
        "sampletime": 7.68688563600881,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 1200000,
        "reward_mean": -0.0885749999999995,
        "reward_max": 1.0181250000000004,
        "reward_min": -1.5162499999999997,
        "leartime_s": 0.01642947699292563,
        "sampletime": 7.807441351993475,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 1220000,
        "reward_mean": -0.1608749999999994,
        "reward_max": 0.7843750000000009,
        "reward_min": -1.2149999999999992,
        "leartime_s": 0.005189362011151388,
        "sampletime": 7.662102215981577,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 1240000,
        "reward_mean": -0.038774999999999504,
        "reward_max": 1.4475000000000007,
        "reward_min": -1.1506249999999998,
        "leartime_s": 0.006360546016367152,
        "sampletime": 7.693370321998373,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 1260000,
        "reward_mean": -0.1417999999999995,
        "reward_max": 1.1193750000000002,
        "reward_min": -1.5006249999999988,
        "leartime_s": 0.006934218021342531,
        "sampletime": 7.783752577000996,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 1280000,
        "reward_mean": 0.006600000000000492,
        "reward_max": 1.1206250000000004,
        "reward_min": -1.5518749999999994,
        "leartime_s": 0.00669556698994711,
        "sampletime": 7.672380364994751,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 1300000,
        "reward_mean": -0.052574999999999504,
        "reward_max": 1.767500000000001,
        "reward_min": -1.1993749999999994,
        "leartime_s": 0.014530396001646295,
        "sampletime": 7.782679980009561,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 1320000,
        "reward_mean": -0.20554999999999943,
        "reward_max": 0.6381250000000007,
        "reward_min": -1.7831249999999996,
        "leartime_s": 0.0066265570058021694,
        "sampletime": 7.843291486991802,
        "best_mean": 0.22585000000000052,
        "best_max": 1.6812500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 1340000,
        "reward_mean": 0.26347500000000046,
        "reward_max": 1.3768750000000005,
        "reward_min": -0.8443749999999997,
        "leartime_s": 0.015660372999263927,
        "sampletime": 7.991220447991509,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 1360000,
        "reward_mean": -0.45049999999999935,
        "reward_max": 0.969375000000001,
        "reward_min": -2.773124999999999,
        "leartime_s": 0.014333700004499406,
        "sampletime": 7.620993884978816,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 1380000,
        "reward_mean": -0.028599999999999477,
        "reward_max": 0.9468750000000007,
        "reward_min": -1.6437499999999998,
        "leartime_s": 0.0066725590149872005,
        "sampletime": 7.668740395019995,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 1400000,
        "reward_mean": -0.18469999999999948,
        "reward_max": 1.2625000000000004,
        "reward_min": -1.9643749999999998,
        "leartime_s": 0.00667941800202243,
        "sampletime": 7.651991244987585,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 1420000,
        "reward_mean": 0.09445000000000055,
        "reward_max": 1.1425000000000005,
        "reward_min": -1.393749999999999,
        "leartime_s": 0.006946090987185016,
        "sampletime": 7.723453089012764,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 1440000,
        "reward_mean": -0.20382499999999953,
        "reward_max": 0.7268750000000008,
        "reward_min": -1.5031250000000005,
        "leartime_s": 0.00670932000502944,
        "sampletime": 7.836796413001139,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 1460000,
        "reward_mean": -0.3401249999999995,
        "reward_max": 0.7906250000000004,
        "reward_min": -1.705625,
        "leartime_s": 0.00818607400287874,
        "sampletime": 7.791743609006517,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 1480000,
        "reward_mean": 0.056475000000000435,
        "reward_max": 0.8656250000000005,
        "reward_min": -0.9093749999999988,
        "leartime_s": 0.00728942098794505,
        "sampletime": 7.732281453005271,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 1500000,
        "reward_mean": 0.013825000000000443,
        "reward_max": 1.1931250000000002,
        "reward_min": -1.395,
        "leartime_s": 0.018297907983651385,
        "sampletime": 7.822750052000629,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 1520000,
        "reward_mean": -0.19157499999999944,
        "reward_max": 0.9737500000000007,
        "reward_min": -1.6256249999999994,
        "leartime_s": 0.007191583979874849,
        "sampletime": 7.865933741006302,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 1540000,
        "reward_mean": -0.31612499999999955,
        "reward_max": 0.8918750000000004,
        "reward_min": -1.9018749999999986,
        "leartime_s": 0.0071199719968717545,
        "sampletime": 7.858712718007155,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 1560000,
        "reward_mean": -0.12209999999999968,
        "reward_max": 1.0343750000000005,
        "reward_min": -1.0368750000000007,
        "leartime_s": 0.007244813983561471,
        "sampletime": 7.723759024986066,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 1580000,
        "reward_mean": -0.03129999999999965,
        "reward_max": 0.9612500000000002,
        "reward_min": -1.5818749999999988,
        "leartime_s": 0.018817139003658667,
        "sampletime": 7.8345315259939525,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 1600000,
        "reward_mean": -0.09117499999999965,
        "reward_max": 0.8337500000000005,
        "reward_min": -0.835624999999999,
        "leartime_s": 0.00722463199053891,
        "sampletime": 7.786743653996382,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 1620000,
        "reward_mean": -0.3146499999999996,
        "reward_max": 0.8868749999999999,
        "reward_min": -1.3881249999999992,
        "leartime_s": 0.011442357994383201,
        "sampletime": 7.672778130974621,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 1640000,
        "reward_mean": 0.1026250000000005,
        "reward_max": 1.1562500000000004,
        "reward_min": -1.2612499999999993,
        "leartime_s": 0.008103997999569401,
        "sampletime": 7.765886884997599,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 1660000,
        "reward_mean": -0.1962749999999996,
        "reward_max": 1.3018750000000003,
        "reward_min": -1.9106249999999985,
        "leartime_s": 0.01390907700988464,
        "sampletime": 7.833224114001496,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 1680000,
        "reward_mean": -0.17617499999999967,
        "reward_max": 0.9337500000000006,
        "reward_min": -1.1662499999999991,
        "leartime_s": 0.012272034015040845,
        "sampletime": 7.890619824989699,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 1700000,
        "reward_mean": -0.04002499999999969,
        "reward_max": 0.8912500000000002,
        "reward_min": -1.728749999999999,
        "leartime_s": 0.00735706600244157,
        "sampletime": 7.917378070997074,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 1720000,
        "reward_mean": -0.2252749999999996,
        "reward_max": 1.0575000000000006,
        "reward_min": -1.4656249999999988,
        "leartime_s": 0.00757509600953199,
        "sampletime": 7.777979582984699,
        "best_mean": 0.26347500000000046,
        "best_max": 1.3768750000000005,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 1740000,
        "reward_mean": 0.2635750000000004,
        "reward_max": 1.1931250000000002,
        "reward_min": -1.0581250000000006,
        "leartime_s": 0.012134185002651066,
        "sampletime": 7.845362665015273,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 1760000,
        "reward_mean": 0.14310000000000037,
        "reward_max": 1.1025000000000005,
        "reward_min": -1.1050000000000004,
        "leartime_s": 0.019211879989597946,
        "sampletime": 7.769578075996833,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 1780000,
        "reward_mean": -0.12402499999999954,
        "reward_max": 1.0693750000000006,
        "reward_min": -1.3724999999999992,
        "leartime_s": 0.007819830003427342,
        "sampletime": 7.789638810005272,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 1800000,
        "reward_mean": -0.0870999999999996,
        "reward_max": 0.8968750000000005,
        "reward_min": -1.0793749999999989,
        "leartime_s": 0.017030695016728714,
        "sampletime": 7.794175371993333,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 1820000,
        "reward_mean": -0.19799999999999968,
        "reward_max": 0.9318750000000007,
        "reward_min": -1.041875,
        "leartime_s": 0.009477965999394655,
        "sampletime": 7.8157322439947166,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 1840000,
        "reward_mean": -0.03287499999999943,
        "reward_max": 1.1050000000000009,
        "reward_min": -1.259374999999999,
        "leartime_s": 0.008033371006604284,
        "sampletime": 7.728919236978982,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 1860000,
        "reward_mean": 0.10607500000000045,
        "reward_max": 1.1512500000000006,
        "reward_min": -1.261249999999999,
        "leartime_s": 0.0077350390201900154,
        "sampletime": 7.797739011992235,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 1880000,
        "reward_mean": -0.02057499999999971,
        "reward_max": 0.9243750000000002,
        "reward_min": -0.8162499999999998,
        "leartime_s": 0.01296114397700876,
        "sampletime": 7.711780407000333,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 1900000,
        "reward_mean": 0.039550000000000356,
        "reward_max": 1.0043750000000005,
        "reward_min": -0.9031249999999996,
        "leartime_s": 0.007866219995776191,
        "sampletime": 7.7452828559908085,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 1920000,
        "reward_mean": -0.04489999999999954,
        "reward_max": 0.7562500000000005,
        "reward_min": -0.9468750000000007,
        "leartime_s": 0.00804437097394839,
        "sampletime": 7.947023955988698,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 1940000,
        "reward_mean": -0.19947499999999962,
        "reward_max": 0.6912500000000004,
        "reward_min": -1.0862499999999995,
        "leartime_s": 0.0190658759966027,
        "sampletime": 7.88849468898843,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 1960000,
        "reward_mean": -0.1773749999999996,
        "reward_max": 1.1112500000000005,
        "reward_min": -1.291875,
        "leartime_s": 0.008259881986305118,
        "sampletime": 7.885567113000434,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 1980000,
        "reward_mean": -0.1716749999999995,
        "reward_max": 0.9581250000000002,
        "reward_min": -0.9537499999999999,
        "leartime_s": 0.00800118298502639,
        "sampletime": 7.720033055986278,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 2000000,
        "reward_mean": -0.27229999999999965,
        "reward_max": 0.6981250000000007,
        "reward_min": -1.2118750000000003,
        "leartime_s": 0.00787644399679266,
        "sampletime": 7.741177941003116,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 2020000,
        "reward_mean": -0.12187499999999961,
        "reward_max": 0.7612500000000006,
        "reward_min": -1.2287499999999991,
        "leartime_s": 0.012069319986039773,
        "sampletime": 7.892150155006675,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 2040000,
        "reward_mean": -0.09487499999999952,
        "reward_max": 0.7050000000000004,
        "reward_min": -1.4437499999999996,
        "leartime_s": 0.012751981994369999,
        "sampletime": 7.775709620007547,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 2060000,
        "reward_mean": -0.2763999999999997,
        "reward_max": 0.7231250000000007,
        "reward_min": -0.9562499999999993,
        "leartime_s": 0.00817870398168452,
        "sampletime": 7.942663572990568,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 2080000,
        "reward_mean": -0.2112249999999997,
        "reward_max": 0.5281250000000005,
        "reward_min": -1.0506249999999995,
        "leartime_s": 0.008030734024941921,
        "sampletime": 7.687773058016319,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 2100000,
        "reward_mean": 0.012325000000000504,
        "reward_max": 1.0900000000000003,
        "reward_min": -1.6143749999999988,
        "leartime_s": 0.008214895002311096,
        "sampletime": 7.624288688006345,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 2120000,
        "reward_mean": 0.09392500000000045,
        "reward_max": 0.9812500000000006,
        "reward_min": -1.1112499999999985,
        "leartime_s": 0.008245585020631552,
        "sampletime": 7.735503728996264,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 2140000,
        "reward_mean": -0.24277499999999952,
        "reward_max": 0.7593750000000006,
        "reward_min": -1.511874999999999,
        "leartime_s": 0.010506553982850164,
        "sampletime": 7.711131354997633,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 2160000,
        "reward_mean": 0.06247500000000048,
        "reward_max": 1.0512500000000007,
        "reward_min": -0.8843750000000004,
        "leartime_s": 0.01777263800613582,
        "sampletime": 7.7383385820139665,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 2180000,
        "reward_mean": 0.21695000000000056,
        "reward_max": 1.0593750000000002,
        "reward_min": -0.9168749999999999,
        "leartime_s": 0.00949286000104621,
        "sampletime": 7.757007588981651,
        "best_mean": 0.2635750000000004,
        "best_max": 1.1931250000000002,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 2200000,
        "reward_mean": 0.3495250000000004,
        "reward_max": 1.4012500000000006,
        "reward_min": -1.3324999999999991,
        "leartime_s": 0.02632730599725619,
        "sampletime": 7.957054530008463,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 2220000,
        "reward_mean": 0.04052500000000058,
        "reward_max": 0.9537500000000003,
        "reward_min": -0.6681249999999991,
        "leartime_s": 0.008564887015381828,
        "sampletime": 7.842848483007401,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 2240000,
        "reward_mean": 0.20315000000000044,
        "reward_max": 1.0956250000000005,
        "reward_min": -0.9043749999999996,
        "leartime_s": 0.008445757994195446,
        "sampletime": 7.765920207020827,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 2260000,
        "reward_mean": 0.0204000000000006,
        "reward_max": 0.7575000000000007,
        "reward_min": -0.9699999999999984,
        "leartime_s": 0.008468109008390456,
        "sampletime": 7.645379825989949,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 2280000,
        "reward_mean": 0.11470000000000047,
        "reward_max": 0.9100000000000006,
        "reward_min": -0.7962499999999998,
        "leartime_s": 0.022201780986506492,
        "sampletime": 7.815561473020352,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 2300000,
        "reward_mean": 0.17892500000000058,
        "reward_max": 1.0412500000000005,
        "reward_min": -0.770624999999999,
        "leartime_s": 0.019821678986772895,
        "sampletime": 7.836157921003178,
        "best_mean": 0.3495250000000004,
        "best_max": 1.4012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 2320000,
        "reward_mean": 0.6025750000000005,
        "reward_max": 1.5093750000000006,
        "reward_min": -0.37437500000000007,
        "leartime_s": 0.010280518006766215,
        "sampletime": 7.786077284021303,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 2340000,
        "reward_mean": 0.4170500000000006,
        "reward_max": 1.3656250000000005,
        "reward_min": -0.4749999999999994,
        "leartime_s": 0.021174108987906948,
        "sampletime": 7.862790222017793,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 2360000,
        "reward_mean": 0.3345250000000007,
        "reward_max": 1.1187500000000008,
        "reward_min": -0.3756249999999993,
        "leartime_s": 0.024149272998329252,
        "sampletime": 7.844233598007122,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 2380000,
        "reward_mean": 0.4028250000000007,
        "reward_max": 1.6762500000000007,
        "reward_min": -1.5812499999999996,
        "leartime_s": 0.008599141001468524,
        "sampletime": 7.812004248989979,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 2400000,
        "reward_mean": 0.49420000000000064,
        "reward_max": 1.4662500000000007,
        "reward_min": -0.7937499999999998,
        "leartime_s": 0.008757770992815495,
        "sampletime": 7.772563243022887,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 2420000,
        "reward_mean": 0.38960000000000067,
        "reward_max": 1.155000000000001,
        "reward_min": -0.4331249999999994,
        "leartime_s": 0.008671069983392954,
        "sampletime": 7.861502309999196,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 2440000,
        "reward_mean": 0.44660000000000066,
        "reward_max": 1.4912500000000013,
        "reward_min": -0.4287499999999995,
        "leartime_s": 0.008710621012141928,
        "sampletime": 7.636574090021895,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 2460000,
        "reward_mean": 0.21990000000000062,
        "reward_max": 0.9318750000000007,
        "reward_min": -0.8462499999999996,
        "leartime_s": 0.008831451996229589,
        "sampletime": 7.780009403009899,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 2480000,
        "reward_mean": 0.4211500000000005,
        "reward_max": 1.3293750000000009,
        "reward_min": -0.2612499999999994,
        "leartime_s": 0.009147573000518605,
        "sampletime": 7.645742240012623,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 2500000,
        "reward_mean": 0.33095000000000063,
        "reward_max": 1.1125000000000007,
        "reward_min": -0.46999999999999914,
        "leartime_s": 0.00899562198901549,
        "sampletime": 7.770982169022318,
        "best_mean": 0.6025750000000005,
        "best_max": 1.5093750000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 2520000,
        "reward_mean": 0.6288000000000007,
        "reward_max": 1.5512500000000007,
        "reward_min": -0.3787499999999988,
        "leartime_s": 0.0089294420031365,
        "sampletime": 7.624547043989878,
        "best_mean": 0.6288000000000007,
        "best_max": 1.5512500000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 2540000,
        "reward_mean": 0.5311250000000007,
        "reward_max": 1.5681250000000007,
        "reward_min": -0.5424999999999996,
        "leartime_s": 0.009004593011923134,
        "sampletime": 7.775645863992395,
        "best_mean": 0.6288000000000007,
        "best_max": 1.5512500000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 2560000,
        "reward_mean": 0.7738000000000007,
        "reward_max": 1.639375000000001,
        "reward_min": -0.28249999999999964,
        "leartime_s": 0.020816779986489564,
        "sampletime": 7.872974068013718,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 2580000,
        "reward_mean": 0.5879750000000006,
        "reward_max": 1.7206250000000007,
        "reward_min": -0.7787499999999992,
        "leartime_s": 0.009212666976964101,
        "sampletime": 7.788393508002628,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 2600000,
        "reward_mean": 0.5711000000000006,
        "reward_max": 1.4868750000000004,
        "reward_min": -0.3224999999999997,
        "leartime_s": 0.009807416994590312,
        "sampletime": 7.720554678991903,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 2620000,
        "reward_mean": 0.6121750000000007,
        "reward_max": 1.4250000000000007,
        "reward_min": -0.1937499999999995,
        "leartime_s": 0.02264003100572154,
        "sampletime": 7.761447154014604,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 2640000,
        "reward_mean": 0.5897500000000004,
        "reward_max": 1.5931250000000001,
        "reward_min": -0.30562499999999937,
        "leartime_s": 0.009168613003566861,
        "sampletime": 7.913730700995075,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 2660000,
        "reward_mean": 0.5289750000000006,
        "reward_max": 1.4412500000000004,
        "reward_min": -0.8987499999999997,
        "leartime_s": 0.009880197991151363,
        "sampletime": 7.726996829005657,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 2680000,
        "reward_mean": 0.4989500000000007,
        "reward_max": 1.318125000000001,
        "reward_min": -0.366874999999999,
        "leartime_s": 0.019080267986282706,
        "sampletime": 7.768130341020878,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 2700000,
        "reward_mean": 0.4795750000000007,
        "reward_max": 1.451875000000001,
        "reward_min": -0.4006249999999994,
        "leartime_s": 0.009310658002505079,
        "sampletime": 7.876132006000262,
        "best_mean": 0.7738000000000007,
        "best_max": 1.639375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 2720000,
        "reward_mean": 0.7838750000000008,
        "reward_max": 1.8156250000000012,
        "reward_min": -1.0406249999999988,
        "leartime_s": 0.035415068006841466,
        "sampletime": 7.7761628559965175,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 2740000,
        "reward_mean": 0.5563000000000006,
        "reward_max": 1.9850000000000008,
        "reward_min": -0.5862499999999997,
        "leartime_s": 0.009311176982009783,
        "sampletime": 7.797593196009984,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 2760000,
        "reward_mean": 0.6296250000000007,
        "reward_max": 1.6937500000000005,
        "reward_min": -0.46187499999999915,
        "leartime_s": 0.009124306990997866,
        "sampletime": 7.766939133987762,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 2780000,
        "reward_mean": 0.6419000000000007,
        "reward_max": 1.6025000000000007,
        "reward_min": -0.22624999999999995,
        "leartime_s": 0.023275080020539463,
        "sampletime": 7.810843524988741,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 2800000,
        "reward_mean": 0.6890000000000007,
        "reward_max": 1.4862500000000005,
        "reward_min": -0.3368749999999988,
        "leartime_s": 0.0093850779812783,
        "sampletime": 7.854255119978916,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 2820000,
        "reward_mean": 0.7083250000000008,
        "reward_max": 1.6125000000000007,
        "reward_min": -0.32500000000000023,
        "leartime_s": 0.025436320021981373,
        "sampletime": 7.783263686025748,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 2840000,
        "reward_mean": 0.6817000000000006,
        "reward_max": 1.648750000000001,
        "reward_min": -0.36687499999999873,
        "leartime_s": 0.009552899020491168,
        "sampletime": 7.763361039018491,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 2860000,
        "reward_mean": 0.7234000000000007,
        "reward_max": 1.718125000000001,
        "reward_min": -0.06812499999999921,
        "leartime_s": 0.00952990900259465,
        "sampletime": 7.632514261000324,
        "best_mean": 0.7838750000000008,
        "best_max": 1.8156250000000012,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 2880000,
        "reward_mean": 1.0293000000000005,
        "reward_max": 1.9893750000000008,
        "reward_min": 0.033750000000001064,
        "leartime_s": 0.01089141602278687,
        "sampletime": 7.489142606995301,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 2900000,
        "reward_mean": 0.6283000000000006,
        "reward_max": 1.7625000000000008,
        "reward_min": -0.25249999999999956,
        "leartime_s": 0.015139351977268234,
        "sampletime": 7.725155187014025,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 2920000,
        "reward_mean": 0.5846750000000005,
        "reward_max": 1.3625,
        "reward_min": -0.44249999999999984,
        "leartime_s": 0.009664309007348493,
        "sampletime": 7.889831424021395,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 2940000,
        "reward_mean": 0.8872250000000008,
        "reward_max": 1.6425000000000007,
        "reward_min": -0.09812499999999934,
        "leartime_s": 0.00996663499972783,
        "sampletime": 7.744838125974638,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 2960000,
        "reward_mean": 0.5379750000000008,
        "reward_max": 1.251875000000001,
        "reward_min": -0.3399999999999992,
        "leartime_s": 0.0096086619887501,
        "sampletime": 7.767276811006013,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 2980000,
        "reward_mean": 0.2777250000000007,
        "reward_max": 1.073125000000001,
        "reward_min": -0.5524999999999999,
        "leartime_s": 0.009812130010686815,
        "sampletime": 7.71472952599288,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 3000000,
        "reward_mean": 0.7275000000000005,
        "reward_max": 1.9612500000000002,
        "reward_min": -0.2993749999999994,
        "leartime_s": 0.009829972987063229,
        "sampletime": 7.868988810980227,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 3020000,
        "reward_mean": 0.7656250000000007,
        "reward_max": 1.753750000000001,
        "reward_min": -0.08437499999999938,
        "leartime_s": 0.00992529300856404,
        "sampletime": 8.013970293017337,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 3040000,
        "reward_mean": 0.5895250000000006,
        "reward_max": 1.730000000000001,
        "reward_min": -0.5749999999999994,
        "leartime_s": 0.021141852979781106,
        "sampletime": 7.819051375001436,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 3060000,
        "reward_mean": 0.5666000000000005,
        "reward_max": 1.6381250000000007,
        "reward_min": -0.4974999999999995,
        "leartime_s": 0.01649952700245194,
        "sampletime": 7.791849997011013,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 3080000,
        "reward_mean": 0.7647000000000005,
        "reward_max": 1.8400000000000005,
        "reward_min": -0.05687499999999937,
        "leartime_s": 0.010250453982735053,
        "sampletime": 7.8600084480131045,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 3100000,
        "reward_mean": 0.6908000000000006,
        "reward_max": 1.7075000000000007,
        "reward_min": -0.6512499999999998,
        "leartime_s": 0.009861220984021202,
        "sampletime": 7.758020445005968,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 3120000,
        "reward_mean": 0.7350750000000007,
        "reward_max": 1.577500000000001,
        "reward_min": -0.2799999999999993,
        "leartime_s": 0.026395163004053757,
        "sampletime": 7.765382782992674,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 3140000,
        "reward_mean": 0.8260500000000005,
        "reward_max": 1.9612500000000002,
        "reward_min": -0.2806249999999994,
        "leartime_s": 0.010505686019314453,
        "sampletime": 7.857504293002421,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 3160000,
        "reward_mean": 0.5538500000000008,
        "reward_max": 1.3506250000000009,
        "reward_min": -0.3743749999999996,
        "leartime_s": 0.010158133984077722,
        "sampletime": 7.701139376993524,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 3180000,
        "reward_mean": 0.6056250000000006,
        "reward_max": 1.5987500000000008,
        "reward_min": -0.5087499999999993,
        "leartime_s": 0.010297786997398362,
        "sampletime": 7.85326565199648,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 3200000,
        "reward_mean": 0.5632250000000008,
        "reward_max": 1.3268750000000007,
        "reward_min": -0.24937499999999996,
        "leartime_s": 0.010137007018784061,
        "sampletime": 7.678911536000669,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 3220000,
        "reward_mean": 0.6330750000000006,
        "reward_max": 1.6175000000000002,
        "reward_min": -0.2418749999999995,
        "leartime_s": 0.011065367987612262,
        "sampletime": 7.850545481982408,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 3240000,
        "reward_mean": 0.5558250000000006,
        "reward_max": 1.3475000000000008,
        "reward_min": -0.46999999999999953,
        "leartime_s": 0.022888384002726525,
        "sampletime": 7.878550626017386,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 3260000,
        "reward_mean": 0.9230750000000005,
        "reward_max": 1.7818750000000008,
        "reward_min": 0.060625000000000526,
        "leartime_s": 0.030064703983953223,
        "sampletime": 7.841239414003212,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 3280000,
        "reward_mean": 0.7089250000000006,
        "reward_max": 1.5387500000000003,
        "reward_min": -0.3762499999999991,
        "leartime_s": 0.010345687973313034,
        "sampletime": 7.591392097994685,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 3300000,
        "reward_mean": 0.9517250000000007,
        "reward_max": 2.1562500000000013,
        "reward_min": -0.14312499999999984,
        "leartime_s": 0.012540965981315821,
        "sampletime": 7.8651356539921835,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 3320000,
        "reward_mean": 0.7288000000000007,
        "reward_max": 1.7543750000000007,
        "reward_min": -0.04562499999999943,
        "leartime_s": 0.010318323998944834,
        "sampletime": 7.675510859000497,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 3340000,
        "reward_mean": 0.24722500000000058,
        "reward_max": 1.1168750000000007,
        "reward_min": -0.7306249999999997,
        "leartime_s": 0.015290162991732359,
        "sampletime": 7.738977897999575,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 3360000,
        "reward_mean": 0.7946750000000007,
        "reward_max": 1.7131250000000002,
        "reward_min": -0.2868749999999992,
        "leartime_s": 0.022822508006356657,
        "sampletime": 7.796117952995701,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 3380000,
        "reward_mean": 0.5415000000000006,
        "reward_max": 1.363750000000001,
        "reward_min": -0.5943749999999999,
        "leartime_s": 0.014366720017278567,
        "sampletime": 7.735026338981697,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 3400000,
        "reward_mean": 0.5966000000000006,
        "reward_max": 1.7187500000000009,
        "reward_min": -0.27062499999999956,
        "leartime_s": 0.02050233501358889,
        "sampletime": 7.747198975004721,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 3420000,
        "reward_mean": 0.1873000000000006,
        "reward_max": 1.4231250000000006,
        "reward_min": -1.1081249999999991,
        "leartime_s": 0.01058708899654448,
        "sampletime": 7.783264425001107,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 3440000,
        "reward_mean": 0.3849250000000007,
        "reward_max": 1.1462500000000004,
        "reward_min": -0.9024999999999999,
        "leartime_s": 0.010771509987534955,
        "sampletime": 7.771014055004343,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 3460000,
        "reward_mean": 0.5013000000000006,
        "reward_max": 1.3031250000000003,
        "reward_min": -0.4512499999999995,
        "leartime_s": 0.01073834000271745,
        "sampletime": 7.789053993998095,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 3480000,
        "reward_mean": 0.7148750000000006,
        "reward_max": 1.5950000000000004,
        "reward_min": -0.2343749999999991,
        "leartime_s": 0.010933381010545418,
        "sampletime": 7.806972127000336,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 3500000,
        "reward_mean": 0.31535000000000063,
        "reward_max": 1.1443750000000006,
        "reward_min": -0.6106249999999991,
        "leartime_s": 0.026026625011581928,
        "sampletime": 7.685922072007088,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 3520000,
        "reward_mean": 0.4727000000000006,
        "reward_max": 1.3118750000000006,
        "reward_min": -0.4099999999999994,
        "leartime_s": 0.011049062013626099,
        "sampletime": 7.880376879998948,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 3540000,
        "reward_mean": 0.5721750000000005,
        "reward_max": 1.5993750000000002,
        "reward_min": -0.5087499999999988,
        "leartime_s": 0.010790872998768464,
        "sampletime": 7.797357698000269,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 3560000,
        "reward_mean": 0.7419000000000006,
        "reward_max": 1.8543750000000006,
        "reward_min": -0.1887499999999995,
        "leartime_s": 0.01061062898952514,
        "sampletime": 7.808697073021904,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 3580000,
        "reward_mean": 0.7002000000000006,
        "reward_max": 1.5212500000000004,
        "reward_min": -0.23374999999999968,
        "leartime_s": 0.012656462989980355,
        "sampletime": 7.873727638012497,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 3600000,
        "reward_mean": 0.5534250000000006,
        "reward_max": 1.6612500000000008,
        "reward_min": -0.4699999999999995,
        "leartime_s": 0.010957385995425284,
        "sampletime": 7.703620953980135,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 3620000,
        "reward_mean": 0.6399500000000006,
        "reward_max": 1.6056250000000012,
        "reward_min": -0.30874999999999986,
        "leartime_s": 0.021629544004099444,
        "sampletime": 7.701800640003057,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 3640000,
        "reward_mean": 0.7199750000000006,
        "reward_max": 1.6837500000000007,
        "reward_min": -0.3937499999999998,
        "leartime_s": 0.019431159977102652,
        "sampletime": 7.707250325009227,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 3660000,
        "reward_mean": 0.3970000000000007,
        "reward_max": 1.3843750000000008,
        "reward_min": -0.6018749999999998,
        "leartime_s": 0.015144336997764185,
        "sampletime": 8.002597805985715,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 3680000,
        "reward_mean": 0.5821250000000007,
        "reward_max": 1.6537500000000007,
        "reward_min": -0.22999999999999945,
        "leartime_s": 0.01128539300407283,
        "sampletime": 7.827510557981441,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 3700000,
        "reward_mean": 0.6692500000000007,
        "reward_max": 1.4156250000000006,
        "reward_min": -0.47187499999999927,
        "leartime_s": 0.011270846996922046,
        "sampletime": 7.770293459994718,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 3720000,
        "reward_mean": 0.4605500000000006,
        "reward_max": 1.293125000000001,
        "reward_min": -0.32499999999999973,
        "leartime_s": 0.01126926700817421,
        "sampletime": 7.813578910019714,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 3740000,
        "reward_mean": 0.6465500000000006,
        "reward_max": 1.7093750000000005,
        "reward_min": -0.2918749999999991,
        "leartime_s": 0.011576905002584681,
        "sampletime": 7.829019711003639,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 3760000,
        "reward_mean": 0.4895000000000007,
        "reward_max": 1.2643750000000007,
        "reward_min": -0.32374999999999904,
        "leartime_s": 0.012625350995222107,
        "sampletime": 7.795220985019114,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 3780000,
        "reward_mean": 0.11532500000000068,
        "reward_max": 1.3493750000000009,
        "reward_min": -1.008124999999999,
        "leartime_s": 0.01353030899190344,
        "sampletime": 7.764007573015988,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 3800000,
        "reward_mean": 0.3207250000000006,
        "reward_max": 1.2225000000000008,
        "reward_min": -1.0481249999999998,
        "leartime_s": 0.02873941499274224,
        "sampletime": 7.837019698985387,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 3820000,
        "reward_mean": 0.4172750000000007,
        "reward_max": 1.3668750000000007,
        "reward_min": -1.3187499999999996,
        "leartime_s": 0.008933079981943592,
        "sampletime": 7.8206031230220105,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 3840000,
        "reward_mean": 0.5846250000000006,
        "reward_max": 1.617500000000001,
        "reward_min": -1.0631249999999994,
        "leartime_s": 0.011407545011024922,
        "sampletime": 7.712172709027072,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 3860000,
        "reward_mean": 0.3134000000000007,
        "reward_max": 1.2306250000000005,
        "reward_min": -0.9824999999999999,
        "leartime_s": 0.011586077976971865,
        "sampletime": 7.827934712986462,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 3880000,
        "reward_mean": 0.3428250000000007,
        "reward_max": 1.1543750000000013,
        "reward_min": -0.993749999999999,
        "leartime_s": 0.015827880997676402,
        "sampletime": 7.865526900975965,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 3900000,
        "reward_mean": 0.7589500000000007,
        "reward_max": 1.8768750000000005,
        "reward_min": -0.26499999999999846,
        "leartime_s": 0.01152926599024795,
        "sampletime": 8.045699987997068,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 3920000,
        "reward_mean": 0.41090000000000076,
        "reward_max": 1.2187500000000007,
        "reward_min": -0.43687499999999896,
        "leartime_s": 0.011477677995571867,
        "sampletime": 7.724784401012585,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 3940000,
        "reward_mean": 0.5049250000000007,
        "reward_max": 1.4962500000000005,
        "reward_min": -0.5943749999999989,
        "leartime_s": 0.02595792998909019,
        "sampletime": 7.7308744360052515,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 3960000,
        "reward_mean": 0.9209500000000006,
        "reward_max": 1.7993750000000008,
        "reward_min": -0.10624999999999933,
        "leartime_s": 0.011887979984749109,
        "sampletime": 7.865325224003755,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 3980000,
        "reward_mean": 0.34970000000000057,
        "reward_max": 1.5768750000000002,
        "reward_min": -0.490625,
        "leartime_s": 0.011416917986935005,
        "sampletime": 7.776867651002249,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 4000000,
        "reward_mean": 0.5657000000000005,
        "reward_max": 1.5087500000000003,
        "reward_min": -0.4737499999999991,
        "leartime_s": 0.02933533099712804,
        "sampletime": 7.920788067014655,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 4020000,
        "reward_mean": 0.5753750000000006,
        "reward_max": 1.5037500000000001,
        "reward_min": -0.6624999999999994,
        "leartime_s": 0.011905656981980428,
        "sampletime": 7.777171915979125,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 4040000,
        "reward_mean": 0.5730000000000007,
        "reward_max": 1.4231250000000006,
        "reward_min": -0.3481249999999997,
        "leartime_s": 0.0158590929931961,
        "sampletime": 7.757476086000679,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 4060000,
        "reward_mean": 0.8509000000000005,
        "reward_max": 1.7581250000000006,
        "reward_min": -0.3337499999999995,
        "leartime_s": 0.029647624003700912,
        "sampletime": 7.8739073110045865,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 4080000,
        "reward_mean": 0.4605750000000006,
        "reward_max": 1.2968750000000004,
        "reward_min": -0.6437499999999998,
        "leartime_s": 0.011936058988794684,
        "sampletime": 7.816484859999036,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 4100000,
        "reward_mean": 0.5551500000000007,
        "reward_max": 1.686250000000001,
        "reward_min": -0.44812499999999944,
        "leartime_s": 0.011903311009518802,
        "sampletime": 7.69673415098805,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 4120000,
        "reward_mean": 0.6317750000000006,
        "reward_max": 1.4943750000000011,
        "reward_min": -0.5418749999999989,
        "leartime_s": 0.02443863300140947,
        "sampletime": 7.750521244015545,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 4140000,
        "reward_mean": 0.9130500000000006,
        "reward_max": 1.707500000000001,
        "reward_min": -0.09562499999999988,
        "leartime_s": 0.013161048002075404,
        "sampletime": 7.778574856987689,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 4160000,
        "reward_mean": 0.6437500000000007,
        "reward_max": 1.5531250000000005,
        "reward_min": -0.3156249999999994,
        "leartime_s": 0.01247745199361816,
        "sampletime": 7.892137254006229,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 4180000,
        "reward_mean": 0.48262500000000064,
        "reward_max": 1.3300000000000005,
        "reward_min": -0.5,
        "leartime_s": 0.012701514002401382,
        "sampletime": 7.833106714999303,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 4200000,
        "reward_mean": 0.5922250000000006,
        "reward_max": 1.4281250000000008,
        "reward_min": -0.75875,
        "leartime_s": 0.028594462986802682,
        "sampletime": 7.87306117801927,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 4220000,
        "reward_mean": 0.8036000000000004,
        "reward_max": 1.8687500000000008,
        "reward_min": -0.18687499999999968,
        "leartime_s": 0.021129859989741817,
        "sampletime": 7.576126483007101,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 4240000,
        "reward_mean": 0.6457750000000005,
        "reward_max": 1.5075000000000007,
        "reward_min": -0.16749999999999932,
        "leartime_s": 0.02655251999385655,
        "sampletime": 7.756699650984956,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 4260000,
        "reward_mean": 0.9158500000000006,
        "reward_max": 1.8593750000000007,
        "reward_min": -0.2650000000000001,
        "leartime_s": 0.02474171097856015,
        "sampletime": 7.742030719004106,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 4280000,
        "reward_mean": 0.7753500000000006,
        "reward_max": 1.5456250000000014,
        "reward_min": -0.07999999999999953,
        "leartime_s": 0.032334917021216825,
        "sampletime": 7.841265857015969,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 4300000,
        "reward_mean": 0.7062000000000007,
        "reward_max": 1.6162500000000006,
        "reward_min": -1.5512499999999996,
        "leartime_s": 0.01851683499990031,
        "sampletime": 7.829181273991708,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 4320000,
        "reward_mean": 0.7832250000000008,
        "reward_max": 1.5818750000000006,
        "reward_min": -0.14624999999999982,
        "leartime_s": 0.01719719500397332,
        "sampletime": 7.883745361992624,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 4340000,
        "reward_mean": 0.9381000000000008,
        "reward_max": 1.7987500000000012,
        "reward_min": 0.12937500000000052,
        "leartime_s": 0.025231287989299744,
        "sampletime": 7.681996695988346,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 4360000,
        "reward_mean": 0.18912500000000065,
        "reward_max": 1.1081250000000007,
        "reward_min": -0.8974999999999991,
        "leartime_s": 0.01218942500418052,
        "sampletime": 7.971203811990563,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 4380000,
        "reward_mean": 0.9527000000000008,
        "reward_max": 1.8368750000000005,
        "reward_min": 0.10125000000000049,
        "leartime_s": 0.013463167008012533,
        "sampletime": 7.774230868002633,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 4400000,
        "reward_mean": 0.5746750000000007,
        "reward_max": 1.3881250000000007,
        "reward_min": -0.7474999999999996,
        "leartime_s": 0.012740079982904717,
        "sampletime": 7.783842602017103,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 4420000,
        "reward_mean": 0.6247750000000006,
        "reward_max": 1.5268750000000004,
        "reward_min": -0.6149999999999994,
        "leartime_s": 0.012667884991969913,
        "sampletime": 7.8418087440077215,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 4440000,
        "reward_mean": 0.5138250000000008,
        "reward_max": 1.4637500000000006,
        "reward_min": -0.8118749999999995,
        "leartime_s": 0.013327249995199963,
        "sampletime": 7.854956405994017,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 4460000,
        "reward_mean": 0.7575250000000006,
        "reward_max": 1.6,
        "reward_min": 0.0037500000000003364,
        "leartime_s": 0.034740937990136445,
        "sampletime": 7.819704413006548,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 4480000,
        "reward_mean": 0.7076000000000007,
        "reward_max": 1.7525000000000004,
        "reward_min": -0.10437499999999963,
        "leartime_s": 0.012867976998677477,
        "sampletime": 7.769411524001043,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 4500000,
        "reward_mean": 0.9252750000000005,
        "reward_max": 2.0800000000000005,
        "reward_min": -0.5406249999999996,
        "leartime_s": 0.013616847980301827,
        "sampletime": 7.729210162011441,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 4520000,
        "reward_mean": 0.9438250000000005,
        "reward_max": 2.2462500000000007,
        "reward_min": -0.11562499999999974,
        "leartime_s": 0.0123914219730068,
        "sampletime": 7.843882768996991,
        "best_mean": 1.0293000000000005,
        "best_max": 1.9893750000000008,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 4540000,
        "reward_mean": 1.0599250000000007,
        "reward_max": 1.9156250000000006,
        "reward_min": 0.18625000000000042,
        "leartime_s": 0.012827726983232424,
        "sampletime": 7.7199133959948085,
        "best_mean": 1.0599250000000007,
        "best_max": 1.9156250000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 4560000,
        "reward_mean": 0.9403000000000007,
        "reward_max": 1.781875,
        "reward_min": -0.08124999999999949,
        "leartime_s": 0.024623776989756152,
        "sampletime": 7.7776854730036575,
        "best_mean": 1.0599250000000007,
        "best_max": 1.9156250000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 4580000,
        "reward_mean": 0.8020750000000006,
        "reward_max": 1.7181250000000006,
        "reward_min": -0.06374999999999922,
        "leartime_s": 0.012821165000787005,
        "sampletime": 7.796231387008447,
        "best_mean": 1.0599250000000007,
        "best_max": 1.9156250000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 4600000,
        "reward_mean": 1.1696000000000009,
        "reward_max": 2.0012500000000006,
        "reward_min": 0.1812500000000004,
        "leartime_s": 0.029253857006551698,
        "sampletime": 7.682222175993957,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 4620000,
        "reward_mean": 1.0047000000000008,
        "reward_max": 1.9512500000000004,
        "reward_min": -0.23437499999999914,
        "leartime_s": 0.013508205011021346,
        "sampletime": 7.741183931007981,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 4640000,
        "reward_mean": 0.7609000000000008,
        "reward_max": 1.6862500000000011,
        "reward_min": -0.9799999999999996,
        "leartime_s": 0.020478601014474407,
        "sampletime": 7.690227724000579,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 4660000,
        "reward_mean": 0.8284250000000006,
        "reward_max": 1.7200000000000009,
        "reward_min": -0.259375,
        "leartime_s": 0.012995831988519058,
        "sampletime": 7.816095226997277,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 4680000,
        "reward_mean": 0.7050000000000007,
        "reward_max": 1.4993750000000006,
        "reward_min": -0.032499999999999474,
        "leartime_s": 0.05079267401015386,
        "sampletime": 7.910878358001355,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 4700000,
        "reward_mean": 0.8506500000000007,
        "reward_max": 1.6681250000000005,
        "reward_min": -0.28499999999999936,
        "leartime_s": 0.02923344701412134,
        "sampletime": 7.862629337003455,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 4720000,
        "reward_mean": 0.7651750000000006,
        "reward_max": 1.6943750000000009,
        "reward_min": -0.2693749999999995,
        "leartime_s": 0.008581711008446291,
        "sampletime": 7.872411037009442,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 4740000,
        "reward_mean": 0.969700000000001,
        "reward_max": 1.872500000000001,
        "reward_min": -0.08374999999999923,
        "leartime_s": 0.013333346985746175,
        "sampletime": 7.729654787981417,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 4760000,
        "reward_mean": 0.8472750000000008,
        "reward_max": 1.7843750000000005,
        "reward_min": -0.5606249999999989,
        "leartime_s": 0.013175092986784875,
        "sampletime": 7.765422511001816,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 4780000,
        "reward_mean": 1.0865750000000007,
        "reward_max": 2.0375000000000005,
        "reward_min": 0.26250000000000095,
        "leartime_s": 0.014417533006053418,
        "sampletime": 7.756414445000701,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 4800000,
        "reward_mean": 0.7643250000000007,
        "reward_max": 1.763125000000001,
        "reward_min": -0.2968749999999993,
        "leartime_s": 0.013845709996530786,
        "sampletime": 7.782829800009495,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 4820000,
        "reward_mean": 0.7712000000000008,
        "reward_max": 1.8043750000000014,
        "reward_min": -0.20937499999999923,
        "leartime_s": 0.023876921011833474,
        "sampletime": 7.9327001179917715,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 4840000,
        "reward_mean": 0.6821500000000008,
        "reward_max": 1.3493750000000009,
        "reward_min": -0.3624999999999994,
        "leartime_s": 0.02309363297536038,
        "sampletime": 7.732576150010573,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 4860000,
        "reward_mean": 0.8758750000000008,
        "reward_max": 1.6650000000000005,
        "reward_min": 0.2750000000000011,
        "leartime_s": 0.013070435990812257,
        "sampletime": 7.81119873400894,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 4880000,
        "reward_mean": 0.7355750000000008,
        "reward_max": 1.9031250000000008,
        "reward_min": -0.242499999999999,
        "leartime_s": 0.01549529898329638,
        "sampletime": 7.898690253001405,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 4900000,
        "reward_mean": 0.7667500000000007,
        "reward_max": 1.4181250000000005,
        "reward_min": -0.02874999999999933,
        "leartime_s": 0.03238880998105742,
        "sampletime": 7.833270333008841,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 4920000,
        "reward_mean": 0.9717500000000007,
        "reward_max": 1.8200000000000005,
        "reward_min": 0.005625000000000421,
        "leartime_s": 0.013564797001890838,
        "sampletime": 7.816143653995823,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 4940000,
        "reward_mean": 0.7897750000000007,
        "reward_max": 1.666250000000001,
        "reward_min": 0.023750000000000472,
        "leartime_s": 0.014860547002172098,
        "sampletime": 7.729380211996613,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 4960000,
        "reward_mean": 0.8722000000000006,
        "reward_max": 1.6006250000000004,
        "reward_min": -0.04249999999999945,
        "leartime_s": 0.012687832990195602,
        "sampletime": 7.735542159003671,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 4980000,
        "reward_mean": 1.0613250000000007,
        "reward_max": 1.8081250000000006,
        "reward_min": -0.2524999999999994,
        "leartime_s": 0.033878647023811936,
        "sampletime": 7.8287612659914885,
        "best_mean": 1.1696000000000009,
        "best_max": 2.0012500000000006,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 5000000,
        "reward_mean": 1.1815500000000005,
        "reward_max": 2.239375000000001,
        "reward_min": 0.07000000000000009,
        "leartime_s": 0.013891817012336105,
        "sampletime": 7.669308487005765,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 5020000,
        "reward_mean": 0.8528250000000007,
        "reward_max": 1.6093750000000004,
        "reward_min": 0.009375000000000203,
        "leartime_s": 0.023392236995277926,
        "sampletime": 7.854949783999473,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 5040000,
        "reward_mean": 0.7014500000000007,
        "reward_max": 1.6818750000000007,
        "reward_min": -0.6775,
        "leartime_s": 0.013733373983995989,
        "sampletime": 7.900247317011235,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 5060000,
        "reward_mean": 0.5926250000000007,
        "reward_max": 1.6800000000000008,
        "reward_min": -0.4349999999999993,
        "leartime_s": 0.01739331299904734,
        "sampletime": 7.843907233007485,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 5080000,
        "reward_mean": 0.7982000000000007,
        "reward_max": 1.9875000000000007,
        "reward_min": -0.4799999999999992,
        "leartime_s": 0.014496479008812457,
        "sampletime": 7.610914869001135,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 5100000,
        "reward_mean": 0.7612250000000007,
        "reward_max": 1.8706250000000009,
        "reward_min": -0.4743749999999997,
        "leartime_s": 0.03426288301125169,
        "sampletime": 7.765557815000648,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 5120000,
        "reward_mean": 0.9423750000000009,
        "reward_max": 1.7206250000000007,
        "reward_min": -0.0718749999999991,
        "leartime_s": 0.0139699210121762,
        "sampletime": 8.0127489019942,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 5140000,
        "reward_mean": 1.0918250000000007,
        "reward_max": 2.135000000000001,
        "reward_min": 0.08062500000000063,
        "leartime_s": 0.02930737700080499,
        "sampletime": 7.759452594007598,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 5160000,
        "reward_mean": 0.5340000000000007,
        "reward_max": 1.5656250000000007,
        "reward_min": -0.6206249999999995,
        "leartime_s": 0.04681784301646985,
        "sampletime": 7.837251899996772,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 5180000,
        "reward_mean": 0.8391750000000009,
        "reward_max": 1.711875000000001,
        "reward_min": -0.34312499999999935,
        "leartime_s": 0.013946665014373139,
        "sampletime": 7.733566348993918,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 5200000,
        "reward_mean": 0.6411000000000006,
        "reward_max": 1.8543750000000006,
        "reward_min": -0.45187500000000014,
        "leartime_s": 0.015349334018537775,
        "sampletime": 7.761536723002791,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 5220000,
        "reward_mean": 0.8945250000000008,
        "reward_max": 1.866250000000001,
        "reward_min": -0.12562499999999935,
        "leartime_s": 0.016473780007800087,
        "sampletime": 7.727011118986411,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 5240000,
        "reward_mean": 0.7717250000000005,
        "reward_max": 1.661250000000001,
        "reward_min": -0.5412499999999991,
        "leartime_s": 0.014257236995035782,
        "sampletime": 7.714554086007411,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 5260000,
        "reward_mean": 0.9550250000000008,
        "reward_max": 2.0681250000000007,
        "reward_min": 0.04187500000000115,
        "leartime_s": 0.02776270901085809,
        "sampletime": 7.767166609992273,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 5280000,
        "reward_mean": 0.6665500000000006,
        "reward_max": 1.685000000000001,
        "reward_min": -0.6393749999999996,
        "leartime_s": 0.029712782008573413,
        "sampletime": 7.766393918020185,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 5300000,
        "reward_mean": 0.8474500000000006,
        "reward_max": 2.0662500000000006,
        "reward_min": -0.2931249999999995,
        "leartime_s": 0.01415286201518029,
        "sampletime": 7.752597382001113,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 5320000,
        "reward_mean": 1.0051750000000008,
        "reward_max": 2.176250000000001,
        "reward_min": -0.5624999999999988,
        "leartime_s": 0.014672874996904284,
        "sampletime": 7.841117036005016,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 5340000,
        "reward_mean": 0.7451750000000007,
        "reward_max": 1.6818750000000007,
        "reward_min": -0.07062499999999933,
        "leartime_s": 0.01459490301203914,
        "sampletime": 7.685225424997043,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 5360000,
        "reward_mean": 0.8384750000000007,
        "reward_max": 1.8225000000000002,
        "reward_min": -0.7937499999999991,
        "leartime_s": 0.023140987002989277,
        "sampletime": 7.832697167992592,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 5380000,
        "reward_mean": 0.8644000000000006,
        "reward_max": 1.7937500000000006,
        "reward_min": -0.11999999999999975,
        "leartime_s": 0.014421130006667227,
        "sampletime": 7.899702930008061,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 5400000,
        "reward_mean": 1.1021750000000006,
        "reward_max": 2.1750000000000007,
        "reward_min": -0.1137499999999993,
        "leartime_s": 0.02792414600844495,
        "sampletime": 7.7918246510089375,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 5420000,
        "reward_mean": 1.0296750000000006,
        "reward_max": 2.299375000000001,
        "reward_min": 0.11375000000000125,
        "leartime_s": 0.018436368001857772,
        "sampletime": 7.858511189988349,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 5440000,
        "reward_mean": 0.8563500000000007,
        "reward_max": 1.8118750000000008,
        "reward_min": -0.45499999999999935,
        "leartime_s": 0.02492527401773259,
        "sampletime": 7.823207004985306,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 5460000,
        "reward_mean": 0.9779250000000007,
        "reward_max": 2.2031250000000004,
        "reward_min": -0.2274999999999999,
        "leartime_s": 0.016208479995839298,
        "sampletime": 7.87558215399622,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 5480000,
        "reward_mean": 1.1412250000000008,
        "reward_max": 2.04375,
        "reward_min": -0.34062499999999923,
        "leartime_s": 0.014652484998805448,
        "sampletime": 7.762722277984722,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 5500000,
        "reward_mean": 1.004750000000001,
        "reward_max": 1.7906250000000004,
        "reward_min": 0.020625000000000837,
        "leartime_s": 0.014893731015035883,
        "sampletime": 7.6711002590018325,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 5520000,
        "reward_mean": 0.9583000000000006,
        "reward_max": 1.8350000000000009,
        "reward_min": -0.23749999999999907,
        "leartime_s": 0.037289950996637344,
        "sampletime": 7.810871048015542,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 5540000,
        "reward_mean": 1.0542500000000006,
        "reward_max": 2.091875000000001,
        "reward_min": 0.16687500000000088,
        "leartime_s": 0.01481191601487808,
        "sampletime": 7.836663353984477,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 5560000,
        "reward_mean": 0.8886500000000006,
        "reward_max": 1.9725000000000006,
        "reward_min": -0.20812499999999967,
        "leartime_s": 0.014990348019637167,
        "sampletime": 7.729695554997306,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 5580000,
        "reward_mean": 1.0135500000000006,
        "reward_max": 1.9968750000000006,
        "reward_min": -0.12499999999999957,
        "leartime_s": 0.022224574990104884,
        "sampletime": 7.688538563990733,
        "best_mean": 1.1815500000000005,
        "best_max": 2.239375000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 5600000,
        "reward_mean": 1.2539750000000005,
        "reward_max": 2.0881250000000007,
        "reward_min": -0.023749999999999372,
        "leartime_s": 0.01711732300464064,
        "sampletime": 7.827171584009193,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 5620000,
        "reward_mean": 0.9836500000000006,
        "reward_max": 1.7975000000000012,
        "reward_min": -0.4224999999999992,
        "leartime_s": 0.017055567994248122,
        "sampletime": 7.653588874003617,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 5640000,
        "reward_mean": 1.0790000000000006,
        "reward_max": 2.4487500000000004,
        "reward_min": -0.2574999999999997,
        "leartime_s": 0.016393780009821057,
        "sampletime": 7.838041504001012,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 5660000,
        "reward_mean": 0.8532500000000007,
        "reward_max": 1.7406250000000008,
        "reward_min": -0.011874999999999566,
        "leartime_s": 0.015479228983167559,
        "sampletime": 7.754786311008502,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 5680000,
        "reward_mean": 0.7965250000000008,
        "reward_max": 1.9456250000000004,
        "reward_min": -0.07874999999999903,
        "leartime_s": 0.019882671011146158,
        "sampletime": 7.927586204983527,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 5700000,
        "reward_mean": 0.8726500000000008,
        "reward_max": 1.9068750000000005,
        "reward_min": -0.32062499999999894,
        "leartime_s": 0.022560910001629964,
        "sampletime": 7.830951577983797,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 5720000,
        "reward_mean": 0.8275000000000007,
        "reward_max": 1.8681250000000003,
        "reward_min": -0.6424999999999994,
        "leartime_s": 0.025351233023684472,
        "sampletime": 7.740067892998923,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 5740000,
        "reward_mean": 1.2101250000000008,
        "reward_max": 2.423750000000001,
        "reward_min": 0.15000000000000108,
        "leartime_s": 0.0360858729982283,
        "sampletime": 7.8790048160008155,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 5760000,
        "reward_mean": 1.1444250000000007,
        "reward_max": 2.138750000000001,
        "reward_min": 0.1643750000000011,
        "leartime_s": 0.024387730984017253,
        "sampletime": 7.760723979998147,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 5780000,
        "reward_mean": 0.7930750000000008,
        "reward_max": 1.729375000000001,
        "reward_min": -0.3043749999999995,
        "leartime_s": 0.01530680400901474,
        "sampletime": 7.879349859984359,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 5800000,
        "reward_mean": 0.9958750000000007,
        "reward_max": 1.7056250000000008,
        "reward_min": 0.1975000000000003,
        "leartime_s": 0.03014445398002863,
        "sampletime": 7.765844290988753,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 5820000,
        "reward_mean": 0.9742000000000007,
        "reward_max": 1.7837500000000004,
        "reward_min": -0.08312499999999957,
        "leartime_s": 0.01931433702702634,
        "sampletime": 7.726025819021743,
        "best_mean": 1.2539750000000005,
        "best_max": 2.0881250000000007,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 5840000,
        "reward_mean": 1.4016250000000008,
        "reward_max": 2.423750000000001,
        "reward_min": 0.45750000000000063,
        "leartime_s": 0.019156786001985893,
        "sampletime": 7.77062956802547,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 5860000,
        "reward_mean": 1.0172411666666674,
        "reward_max": 2.2118750000000005,
        "reward_min": -0.3849999999999993,
        "leartime_s": 0.023324803012656048,
        "sampletime": 7.951232897001319,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 5880000,
        "reward_mean": 1.1798250000000008,
        "reward_max": 2.256875,
        "reward_min": 0.20750000000000043,
        "leartime_s": 0.016990506002912298,
        "sampletime": 8.093653739982983,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 5900000,
        "reward_mean": 0.9639750000000007,
        "reward_max": 1.9637500000000006,
        "reward_min": 0.13562500000000072,
        "leartime_s": 0.015312197007006034,
        "sampletime": 7.756887423020089,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 5920000,
        "reward_mean": 0.8143250000000007,
        "reward_max": 1.7318750000000005,
        "reward_min": -0.2837499999999996,
        "leartime_s": 0.016791124013252556,
        "sampletime": 7.8017017480160575,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 5940000,
        "reward_mean": 1.2375250000000009,
        "reward_max": 2.0206250000000003,
        "reward_min": 0.4806250000000004,
        "leartime_s": 0.0157364479964599,
        "sampletime": 7.725563352025347,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 5960000,
        "reward_mean": 1.0545750000000007,
        "reward_max": 2.1012500000000003,
        "reward_min": 0.11750000000000066,
        "leartime_s": 0.028554872988024727,
        "sampletime": 7.797571026982041,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 5980000,
        "reward_mean": 1.2817000000000007,
        "reward_max": 2.2150000000000003,
        "reward_min": 0.2575000000000012,
        "leartime_s": 0.015813578997040167,
        "sampletime": 7.846386156015797,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 6000000,
        "reward_mean": 1.1505750000000008,
        "reward_max": 2.04,
        "reward_min": 0.16812500000000058,
        "leartime_s": 0.03255651600193232,
        "sampletime": 7.8246746629884,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 6020000,
        "reward_mean": 0.6227750000000006,
        "reward_max": 1.7368750000000006,
        "reward_min": -1.5893749999999995,
        "leartime_s": 0.0252742120064795,
        "sampletime": 7.824001195986057,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 6040000,
        "reward_mean": 1.1113500000000007,
        "reward_max": 2.4318750000000002,
        "reward_min": 0.14062500000000056,
        "leartime_s": 0.015759803995024413,
        "sampletime": 7.838889036007458,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 6060000,
        "reward_mean": 1.2308000000000006,
        "reward_max": 2.3975000000000004,
        "reward_min": -0.24937499999999999,
        "leartime_s": 0.013366457977099344,
        "sampletime": 7.804067032993771,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 6080000,
        "reward_mean": 0.9458250000000006,
        "reward_max": 1.790000000000001,
        "reward_min": 0.10250000000000012,
        "leartime_s": 0.03554952098056674,
        "sampletime": 7.753485107008601,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 6100000,
        "reward_mean": 1.1023250000000007,
        "reward_max": 2.2375000000000003,
        "reward_min": -0.8424999999999996,
        "leartime_s": 0.01657235002494417,
        "sampletime": 7.781705070985481,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 6120000,
        "reward_mean": 0.9821000000000006,
        "reward_max": 2.0881250000000007,
        "reward_min": -0.2150000000000001,
        "leartime_s": 0.03589987399755046,
        "sampletime": 7.8013194460072555,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 6140000,
        "reward_mean": 0.8534750000000005,
        "reward_max": 1.9356250000000006,
        "reward_min": -0.33749999999999913,
        "leartime_s": 0.016399577987613156,
        "sampletime": 7.872474275995046,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 6160000,
        "reward_mean": 0.9374000000000008,
        "reward_max": 1.8625000000000003,
        "reward_min": -0.4312499999999993,
        "leartime_s": 0.01595772398286499,
        "sampletime": 7.744368043000577,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 6180000,
        "reward_mean": 1.0200000000000007,
        "reward_max": 1.831250000000001,
        "reward_min": -0.12187499999999918,
        "leartime_s": 0.03861241499544121,
        "sampletime": 7.7772622689954005,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 6200000,
        "reward_mean": 0.8027000000000006,
        "reward_max": 1.8925000000000003,
        "reward_min": -0.8937499999999996,
        "leartime_s": 0.01612685198779218,
        "sampletime": 7.760259028000291,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 6220000,
        "reward_mean": 0.6485750000000007,
        "reward_max": 1.5850000000000004,
        "reward_min": -0.7149999999999999,
        "leartime_s": 0.033675701008178294,
        "sampletime": 7.739517312002135,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 6240000,
        "reward_mean": 1.0791000000000004,
        "reward_max": 2.1706250000000007,
        "reward_min": -0.0018749999999992661,
        "leartime_s": 0.01604539100662805,
        "sampletime": 7.628862632001983,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 6260000,
        "reward_mean": 0.8176750000000006,
        "reward_max": 1.8225000000000007,
        "reward_min": -0.045625,
        "leartime_s": 0.030209342017769814,
        "sampletime": 7.875719593983376,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 6280000,
        "reward_mean": 0.8736250000000005,
        "reward_max": 1.6918750000000005,
        "reward_min": -0.12374999999999989,
        "leartime_s": 0.030405842000618577,
        "sampletime": 7.83423883098294,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 6300000,
        "reward_mean": 0.7907500000000007,
        "reward_max": 1.8243750000000005,
        "reward_min": -0.29812499999999975,
        "leartime_s": 0.020419936976395547,
        "sampletime": 7.768239326018374,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 6320000,
        "reward_mean": 0.9168750000000007,
        "reward_max": 2.0168750000000006,
        "reward_min": -0.0556249999999994,
        "leartime_s": 0.029154098010621965,
        "sampletime": 7.856062801001826,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 6340000,
        "reward_mean": 0.5484500000000008,
        "reward_max": 1.5075000000000005,
        "reward_min": -0.5824999999999989,
        "leartime_s": 0.04342299301060848,
        "sampletime": 7.92595122999046,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 6360000,
        "reward_mean": 1.0935250000000007,
        "reward_max": 2.5731249999999997,
        "reward_min": -0.2787499999999991,
        "leartime_s": 0.03068536997307092,
        "sampletime": 7.693643606005935,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 6380000,
        "reward_mean": 1.2559250000000004,
        "reward_max": 2.4525000000000006,
        "reward_min": 0.16250000000000042,
        "leartime_s": 0.017459143011365086,
        "sampletime": 7.914032693981426,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 6400000,
        "reward_mean": 0.8998000000000005,
        "reward_max": 2.1081250000000002,
        "reward_min": -0.9162499999999999,
        "leartime_s": 0.016635993000818416,
        "sampletime": 7.839088359993184,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 6420000,
        "reward_mean": 0.7013750000000006,
        "reward_max": 1.7737500000000008,
        "reward_min": -0.6568749999999995,
        "leartime_s": 0.025662954023573548,
        "sampletime": 7.776055479014758,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 6440000,
        "reward_mean": 0.8933500000000009,
        "reward_max": 1.7006250000000007,
        "reward_min": -0.16624999999999956,
        "leartime_s": 0.01605859797564335,
        "sampletime": 7.854251327982638,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 6460000,
        "reward_mean": 0.9612750000000007,
        "reward_max": 1.8543750000000008,
        "reward_min": -0.7068749999999998,
        "leartime_s": 0.016332936997059733,
        "sampletime": 7.785470392002026,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 6480000,
        "reward_mean": 1.2686750000000007,
        "reward_max": 2.0750000000000006,
        "reward_min": 0.11250000000000071,
        "leartime_s": 0.0327866560255643,
        "sampletime": 7.7498532840108965,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 6500000,
        "reward_mean": 1.0074750000000008,
        "reward_max": 2.309375000000001,
        "reward_min": -0.4474999999999994,
        "leartime_s": 0.038835397019283846,
        "sampletime": 7.853704158012988,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 6520000,
        "reward_mean": 1.1629000000000005,
        "reward_max": 2.1987500000000004,
        "reward_min": -0.30374999999999924,
        "leartime_s": 0.04200990899698809,
        "sampletime": 7.949159400013741,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 6540000,
        "reward_mean": 0.9506000000000006,
        "reward_max": 2.2481250000000004,
        "reward_min": -0.2318749999999994,
        "leartime_s": 0.016997254017041996,
        "sampletime": 7.835790006007301,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 6560000,
        "reward_mean": 0.9545500000000007,
        "reward_max": 2.5256250000000002,
        "reward_min": -0.2749999999999997,
        "leartime_s": 0.017370937013765797,
        "sampletime": 7.715495182026643,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 6580000,
        "reward_mean": 0.9966750000000006,
        "reward_max": 2.114375,
        "reward_min": -0.416249999999999,
        "leartime_s": 0.038872162986081094,
        "sampletime": 7.894149922998622,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 6600000,
        "reward_mean": 1.1826250000000007,
        "reward_max": 2.44625,
        "reward_min": 0.135625000000001,
        "leartime_s": 0.0322115320013836,
        "sampletime": 7.754431338980794,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 6620000,
        "reward_mean": 0.44642500000000057,
        "reward_max": 1.6781250000000005,
        "reward_min": -1.55625,
        "leartime_s": 0.06531775399344042,
        "sampletime": 7.734990589990048,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 6640000,
        "reward_mean": 0.6703750000000006,
        "reward_max": 1.9006250000000005,
        "reward_min": -1.1168749999999994,
        "leartime_s": 0.017514334991574287,
        "sampletime": 7.606339557998581,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 6660000,
        "reward_mean": 0.8031250000000006,
        "reward_max": 1.6037500000000007,
        "reward_min": -0.6056249999999991,
        "leartime_s": 0.01688659901265055,
        "sampletime": 7.83543083697441,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 6680000,
        "reward_mean": 0.9009500000000006,
        "reward_max": 1.8937500000000005,
        "reward_min": -0.3762499999999993,
        "leartime_s": 0.014724623993970454,
        "sampletime": 7.900872783997329,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 6700000,
        "reward_mean": 1.0799250000000007,
        "reward_max": 2.2468750000000006,
        "reward_min": -0.15624999999999953,
        "leartime_s": 0.017006437992677093,
        "sampletime": 7.907849541021278,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 6720000,
        "reward_mean": 0.4715000000000007,
        "reward_max": 1.523125000000001,
        "reward_min": -0.7043749999999996,
        "leartime_s": 0.046958521008491516,
        "sampletime": 7.8592753449920565,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 6740000,
        "reward_mean": 1.0657250000000007,
        "reward_max": 2.2462500000000007,
        "reward_min": 0.02937500000000043,
        "leartime_s": 0.026391480991151184,
        "sampletime": 7.764027751982212,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 6760000,
        "reward_mean": 0.8540750000000006,
        "reward_max": 2.029375000000001,
        "reward_min": -1.0449999999999997,
        "leartime_s": 0.03621283298707567,
        "sampletime": 7.725506991992006,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 6780000,
        "reward_mean": 1.0546000000000006,
        "reward_max": 2.17125,
        "reward_min": -0.1743749999999991,
        "leartime_s": 0.019014055986190215,
        "sampletime": 7.846571754984325,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 6800000,
        "reward_mean": 0.8295815000000006,
        "reward_max": 1.9493750000000005,
        "reward_min": -0.8143749999999996,
        "leartime_s": 0.01704199699452147,
        "sampletime": 7.973564807005459,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 6820000,
        "reward_mean": 0.8240500000000007,
        "reward_max": 1.6568750000000008,
        "reward_min": 0.06500000000000095,
        "leartime_s": 0.03947261199937202,
        "sampletime": 7.855476797994925,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 6840000,
        "reward_mean": 0.7585500000000008,
        "reward_max": 1.8062500000000008,
        "reward_min": -0.5281249999999994,
        "leartime_s": 0.01861208101036027,
        "sampletime": 7.929208686022321,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 6860000,
        "reward_mean": 0.8727750000000006,
        "reward_max": 2.1281250000000007,
        "reward_min": -0.2999999999999997,
        "leartime_s": 0.025582464004401118,
        "sampletime": 7.850024298997596,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 6880000,
        "reward_mean": 0.7119500000000009,
        "reward_max": 1.6762500000000007,
        "reward_min": -0.8318749999999996,
        "leartime_s": 0.017329615977359936,
        "sampletime": 7.825712078018114,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 6900000,
        "reward_mean": 0.7192250000000006,
        "reward_max": 1.9800000000000004,
        "reward_min": -1.3443749999999997,
        "leartime_s": 0.04456965500139631,
        "sampletime": 7.768993028003024,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 6920000,
        "reward_mean": 1.0113500000000006,
        "reward_max": 1.9700000000000006,
        "reward_min": -0.32625,
        "leartime_s": 0.030208632990252227,
        "sampletime": 7.787678827007767,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 6940000,
        "reward_mean": 1.0811750000000007,
        "reward_max": 2.166875000000001,
        "reward_min": -0.7749999999999994,
        "leartime_s": 0.01918346300953999,
        "sampletime": 7.816280839993851,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 6960000,
        "reward_mean": 0.8193750000000006,
        "reward_max": 1.851250000000001,
        "reward_min": -0.778749999999999,
        "leartime_s": 0.02553134399931878,
        "sampletime": 7.823365557007492,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 6980000,
        "reward_mean": 1.1371500000000005,
        "reward_max": 2.172500000000001,
        "reward_min": 0.2756250000000003,
        "leartime_s": 0.026490151998586953,
        "sampletime": 7.859293626010185,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 7000000,
        "reward_mean": 0.8840750000000007,
        "reward_max": 1.8962500000000007,
        "reward_min": -0.4099999999999995,
        "leartime_s": 0.019695294002303854,
        "sampletime": 7.84421895199921,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 7020000,
        "reward_mean": 0.6415750000000007,
        "reward_max": 1.8525000000000005,
        "reward_min": -0.7287499999999993,
        "leartime_s": 0.017714476998662576,
        "sampletime": 7.9978524330072105,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 7040000,
        "reward_mean": 0.8494500000000006,
        "reward_max": 1.6762500000000007,
        "reward_min": -0.16812499999999914,
        "leartime_s": 0.037432563985930756,
        "sampletime": 7.842938354006037,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 7060000,
        "reward_mean": 0.5629250000000007,
        "reward_max": 1.430625000000001,
        "reward_min": -0.588749999999999,
        "leartime_s": 0.020335119974333793,
        "sampletime": 7.806380427995464,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 7080000,
        "reward_mean": 1.1040000000000008,
        "reward_max": 1.9100000000000008,
        "reward_min": -0.10749999999999968,
        "leartime_s": 0.02829431599820964,
        "sampletime": 7.762921079993248,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 7100000,
        "reward_mean": 0.8463750000000007,
        "reward_max": 2.010000000000001,
        "reward_min": -0.17437499999999992,
        "leartime_s": 0.03497501902165823,
        "sampletime": 7.6902103789907414,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 7120000,
        "reward_mean": 1.0214250000000007,
        "reward_max": 2.09,
        "reward_min": -0.005624999999999256,
        "leartime_s": 0.038727901002857834,
        "sampletime": 7.850866077002138,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 7140000,
        "reward_mean": 0.5578500000000007,
        "reward_max": 1.5537500000000009,
        "reward_min": -0.7593749999999995,
        "leartime_s": 0.017815495986724272,
        "sampletime": 7.605971465993207,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 7160000,
        "reward_mean": 0.9526000000000007,
        "reward_max": 1.9606250000000007,
        "reward_min": -0.25687499999999974,
        "leartime_s": 0.028515136014902964,
        "sampletime": 7.866443325008731,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 7180000,
        "reward_mean": 1.1030250000000006,
        "reward_max": 2.184375,
        "reward_min": 0.07562500000000022,
        "leartime_s": 0.018180868995841593,
        "sampletime": 7.981988869985798,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 7200000,
        "reward_mean": 0.7022000000000006,
        "reward_max": 1.7675000000000005,
        "reward_min": -0.6081249999999994,
        "leartime_s": 0.02249348899931647,
        "sampletime": 7.858158561022719,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 7220000,
        "reward_mean": 0.7676250000000008,
        "reward_max": 1.8450000000000004,
        "reward_min": -0.453124999999999,
        "leartime_s": 0.024537097982829437,
        "sampletime": 7.786676718998933,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 7240000,
        "reward_mean": 1.1475250000000006,
        "reward_max": 2.0281250000000006,
        "reward_min": 0.4212500000000007,
        "leartime_s": 0.027887656004168093,
        "sampletime": 7.8080002200149465,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 7260000,
        "reward_mean": 0.5952500000000007,
        "reward_max": 1.4800000000000009,
        "reward_min": -0.8349999999999992,
        "leartime_s": 0.03160016899346374,
        "sampletime": 7.685209822026081,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 7280000,
        "reward_mean": 0.8557750000000007,
        "reward_max": 1.9337500000000005,
        "reward_min": -0.18874999999999917,
        "leartime_s": 0.01996528499876149,
        "sampletime": 7.829620996984886,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 7300000,
        "reward_mean": 0.8850500000000007,
        "reward_max": 1.9768750000000008,
        "reward_min": -0.5262499999999996,
        "leartime_s": 0.036753709020558745,
        "sampletime": 7.712262067012489,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 7320000,
        "reward_mean": 0.9853750000000007,
        "reward_max": 2.006250000000001,
        "reward_min": 0.06812500000000035,
        "leartime_s": 0.035470228001940995,
        "sampletime": 7.661341436003568,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 7340000,
        "reward_mean": 0.7726000000000007,
        "reward_max": 1.9143750000000006,
        "reward_min": -0.7143749999999998,
        "leartime_s": 0.01866954000433907,
        "sampletime": 7.8559772910084575,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 7360000,
        "reward_mean": 0.6726000000000008,
        "reward_max": 1.5075000000000007,
        "reward_min": -0.38187499999999885,
        "leartime_s": 0.036030738992849365,
        "sampletime": 7.792394935997436,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 7380000,
        "reward_mean": 0.5474000000000006,
        "reward_max": 1.5500000000000007,
        "reward_min": -0.8474999999999991,
        "leartime_s": 0.04028784699039534,
        "sampletime": 7.808687020005891,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 7400000,
        "reward_mean": 1.0421750000000007,
        "reward_max": 2.2812500000000004,
        "reward_min": -0.16249999999999926,
        "leartime_s": 0.03505401700385846,
        "sampletime": 7.901510919997236,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 7420000,
        "reward_mean": 1.0162750000000007,
        "reward_max": 2.38125,
        "reward_min": 0.07875000000000061,
        "leartime_s": 0.016703041997971013,
        "sampletime": 7.787170730996877,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 7440000,
        "reward_mean": 0.7948500000000006,
        "reward_max": 1.751875000000001,
        "reward_min": -0.3493749999999992,
        "leartime_s": 0.03388770401943475,
        "sampletime": 7.67169379000552,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 7460000,
        "reward_mean": 0.7747750000000007,
        "reward_max": 1.5731250000000006,
        "reward_min": -0.3074999999999991,
        "leartime_s": 0.02565261401468888,
        "sampletime": 7.758382826985326,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 7480000,
        "reward_mean": 0.6610000000000006,
        "reward_max": 1.5850000000000006,
        "reward_min": -0.4468749999999992,
        "leartime_s": 0.01840103798895143,
        "sampletime": 7.822704274993157,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 7500000,
        "reward_mean": 0.4214750000000007,
        "reward_max": 1.3256250000000007,
        "reward_min": -0.7531249999999989,
        "leartime_s": 0.019720729993423447,
        "sampletime": 7.864109674002975,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 7520000,
        "reward_mean": 0.6910000000000007,
        "reward_max": 1.7925,
        "reward_min": -0.1499999999999993,
        "leartime_s": 0.023429552995366976,
        "sampletime": 7.748670757981017,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 7540000,
        "reward_mean": 0.5311500000000006,
        "reward_max": 1.7375000000000007,
        "reward_min": -1.2137499999999992,
        "leartime_s": 0.020369823992950842,
        "sampletime": 7.8484758349950425,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 7560000,
        "reward_mean": 0.6855750000000007,
        "reward_max": 1.555000000000001,
        "reward_min": -0.4606249999999995,
        "leartime_s": 0.01866401601000689,
        "sampletime": 7.880123712995555,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 7580000,
        "reward_mean": 0.7403000000000007,
        "reward_max": 1.8868750000000005,
        "reward_min": -1.6543749999999993,
        "leartime_s": 0.01857963899965398,
        "sampletime": 7.8271569600037765,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 7600000,
        "reward_mean": 0.4981250000000006,
        "reward_max": 1.5718750000000004,
        "reward_min": -1.0362499999999994,
        "leartime_s": 0.020037408015923575,
        "sampletime": 7.627810189995216,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 7620000,
        "reward_mean": 0.9431000000000007,
        "reward_max": 2.1343750000000012,
        "reward_min": -0.4162499999999999,
        "leartime_s": 0.039381852984661236,
        "sampletime": 7.812994141975651,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 7640000,
        "reward_mean": 0.8814000000000006,
        "reward_max": 2.015625000000001,
        "reward_min": 0.046250000000001124,
        "leartime_s": 0.018376595980953425,
        "sampletime": 7.794476398004917,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 7660000,
        "reward_mean": 0.8693500000000006,
        "reward_max": 1.8750000000000004,
        "reward_min": -0.20062499999999928,
        "leartime_s": 0.019186270015779883,
        "sampletime": 7.802207650995115,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 7680000,
        "reward_mean": 0.8658750000000007,
        "reward_max": 1.7362500000000005,
        "reward_min": -0.1674999999999997,
        "leartime_s": 0.030313127004774287,
        "sampletime": 7.96767211300903,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 7700000,
        "reward_mean": 0.5887000000000004,
        "reward_max": 1.6243750000000003,
        "reward_min": -0.8662499999999989,
        "leartime_s": 0.027407593006500974,
        "sampletime": 7.898487727012252,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 7720000,
        "reward_mean": 0.7986500000000006,
        "reward_max": 1.707500000000001,
        "reward_min": -0.15374999999999842,
        "leartime_s": 0.02434410701971501,
        "sampletime": 7.7197712720080744,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 7740000,
        "reward_mean": 0.5487500000000005,
        "reward_max": 1.6575000000000004,
        "reward_min": -0.5356249999999995,
        "leartime_s": 0.018828447005944327,
        "sampletime": 7.835853058000794,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 7760000,
        "reward_mean": 1.2145500000000007,
        "reward_max": 2.3868750000000007,
        "reward_min": -0.24562499999999937,
        "leartime_s": 0.019642633997136727,
        "sampletime": 7.815846942015924,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 7780000,
        "reward_mean": 0.8125750000000005,
        "reward_max": 1.7487500000000002,
        "reward_min": -0.2618749999999994,
        "leartime_s": 0.023395886993966997,
        "sampletime": 7.809615220990963,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 7800000,
        "reward_mean": 0.5441250000000006,
        "reward_max": 1.7112500000000008,
        "reward_min": -0.7537499999999988,
        "leartime_s": 0.019437837996520102,
        "sampletime": 7.855513215996325,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 7820000,
        "reward_mean": 0.9055500000000006,
        "reward_max": 1.9387500000000006,
        "reward_min": -0.7531249999999989,
        "leartime_s": 0.02057150099426508,
        "sampletime": 7.79257253598189,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 7840000,
        "reward_mean": 0.7153250000000008,
        "reward_max": 1.8443750000000005,
        "reward_min": -0.4418749999999994,
        "leartime_s": 0.021122503996593878,
        "sampletime": 7.89257876900956,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 7860000,
        "reward_mean": 0.7057250000000005,
        "reward_max": 1.9612500000000002,
        "reward_min": -1.4574999999999998,
        "leartime_s": 0.020036177011206746,
        "sampletime": 7.721998688997701,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 7880000,
        "reward_mean": 0.7780250000000006,
        "reward_max": 2.0843750000000005,
        "reward_min": -0.4531249999999994,
        "leartime_s": 0.019402912992518395,
        "sampletime": 7.7337045519961976,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 7900000,
        "reward_mean": 0.46192500000000064,
        "reward_max": 1.3762500000000006,
        "reward_min": -0.8068749999999993,
        "leartime_s": 0.01971310400404036,
        "sampletime": 7.631479995005066,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 7920000,
        "reward_mean": 0.5567500000000006,
        "reward_max": 1.756875000000001,
        "reward_min": -0.682499999999999,
        "leartime_s": 0.019222586997784674,
        "sampletime": 7.875977982010227,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 7940000,
        "reward_mean": 0.6112750000000008,
        "reward_max": 1.615625000000001,
        "reward_min": -0.7924999999999991,
        "leartime_s": 0.026730031007900834,
        "sampletime": 7.927600641996833,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 7960000,
        "reward_mean": 0.9127250000000007,
        "reward_max": 1.9656250000000004,
        "reward_min": 0.03687500000000096,
        "leartime_s": 0.01985549199162051,
        "sampletime": 7.788459143019281,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 7980000,
        "reward_mean": 0.5096000000000006,
        "reward_max": 1.3162500000000004,
        "reward_min": -0.7849999999999993,
        "leartime_s": 0.037858972005778924,
        "sampletime": 7.827446387003874,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 8000000,
        "reward_mean": 0.8055250000000005,
        "reward_max": 2.1587500000000004,
        "reward_min": -0.5025000000000002,
        "leartime_s": 0.028762789006577805,
        "sampletime": 7.763946193008451,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 8020000,
        "reward_mean": 0.6492750000000005,
        "reward_max": 1.6543750000000006,
        "reward_min": -0.9093749999999998,
        "leartime_s": 0.02601995598524809,
        "sampletime": 7.758423880994087,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 8040000,
        "reward_mean": 0.7821000000000006,
        "reward_max": 1.6968750000000001,
        "reward_min": -0.18374999999999975,
        "leartime_s": 0.02006694398005493,
        "sampletime": 7.793393739004387,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 8060000,
        "reward_mean": 0.6681750000000006,
        "reward_max": 1.570000000000001,
        "reward_min": -0.3924999999999995,
        "leartime_s": 0.05117391899693757,
        "sampletime": 7.833217715000501,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 8080000,
        "reward_mean": 1.3327250000000008,
        "reward_max": 2.081875,
        "reward_min": 0.4612500000000006,
        "leartime_s": 0.039314371009822935,
        "sampletime": 7.750958112999797,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 8100000,
        "reward_mean": 0.8233500000000006,
        "reward_max": 1.802500000000001,
        "reward_min": -0.25499999999999934,
        "leartime_s": 0.017811241996241733,
        "sampletime": 7.75228225698811,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 8120000,
        "reward_mean": 0.8217500000000006,
        "reward_max": 1.773750000000001,
        "reward_min": -0.09187499999999935,
        "leartime_s": 0.030507674004184082,
        "sampletime": 7.751042564021191,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 8140000,
        "reward_mean": 0.8476000000000006,
        "reward_max": 2.045625000000001,
        "reward_min": -0.21437499999999915,
        "leartime_s": 0.04148816500674002,
        "sampletime": 7.625200873997528,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 8160000,
        "reward_mean": 0.7448000000000007,
        "reward_max": 1.8118750000000003,
        "reward_min": -0.35687499999999955,
        "leartime_s": 0.019875909987604246,
        "sampletime": 7.923914842976956,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 8180000,
        "reward_mean": 0.8654000000000006,
        "reward_max": 1.8825000000000007,
        "reward_min": -0.3999999999999998,
        "leartime_s": 0.03881011498742737,
        "sampletime": 7.703275553998537,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 8200000,
        "reward_mean": 0.6022000000000007,
        "reward_max": 1.576875000000001,
        "reward_min": -0.21874999999999933,
        "leartime_s": 0.022466274996986613,
        "sampletime": 7.708682819007663,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 8220000,
        "reward_mean": 0.8776000000000006,
        "reward_max": 2.0768750000000002,
        "reward_min": -0.1306249999999989,
        "leartime_s": 0.024959643022157252,
        "sampletime": 7.691476707987022,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 8240000,
        "reward_mean": 0.8931500000000007,
        "reward_max": 2.031250000000001,
        "reward_min": -0.33124999999999977,
        "leartime_s": 0.019775416993070394,
        "sampletime": 7.710265961010009,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 8260000,
        "reward_mean": 0.6245250000000008,
        "reward_max": 1.6018750000000006,
        "reward_min": -0.7999999999999993,
        "leartime_s": 0.02529331500409171,
        "sampletime": 7.736133603990311,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 8280000,
        "reward_mean": 0.7486250000000007,
        "reward_max": 1.6881250000000012,
        "reward_min": -0.9937499999999999,
        "leartime_s": 0.019851357996230945,
        "sampletime": 7.791797436017077,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 8300000,
        "reward_mean": 0.7204750000000006,
        "reward_max": 1.6737500000000005,
        "reward_min": -0.7337499999999997,
        "leartime_s": 0.03599904500879347,
        "sampletime": 7.892480957991211,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 8320000,
        "reward_mean": 0.8586250000000004,
        "reward_max": 1.8956250000000001,
        "reward_min": -0.5043749999999992,
        "leartime_s": 0.04375684299157001,
        "sampletime": 7.952934222994372,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 8340000,
        "reward_mean": 0.44010000000000066,
        "reward_max": 1.5587500000000007,
        "reward_min": -1.4375000000000002,
        "leartime_s": 0.046453666989691556,
        "sampletime": 7.7657074320013635,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 8360000,
        "reward_mean": 0.6630000000000007,
        "reward_max": 1.6662500000000011,
        "reward_min": -0.6143749999999994,
        "leartime_s": 0.03279908001422882,
        "sampletime": 7.746778720000293,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 8380000,
        "reward_mean": 0.7689000000000006,
        "reward_max": 1.8331250000000006,
        "reward_min": -0.7524999999999992,
        "leartime_s": 0.020542373997159302,
        "sampletime": 7.777453590009827,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 8400000,
        "reward_mean": 0.8442750000000008,
        "reward_max": 1.7181250000000003,
        "reward_min": -0.9718749999999987,
        "leartime_s": 0.02018956100801006,
        "sampletime": 7.821192808973137,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 8420000,
        "reward_mean": 1.0925500000000006,
        "reward_max": 2.06375,
        "reward_min": 0.14000000000000054,
        "leartime_s": 0.028381543001160026,
        "sampletime": 7.737956641009077,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 8440000,
        "reward_mean": 0.7227250000000007,
        "reward_max": 1.7775000000000007,
        "reward_min": -0.5362499999999999,
        "leartime_s": 0.03533183201216161,
        "sampletime": 7.845902779023163,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 8460000,
        "reward_mean": 1.1764000000000006,
        "reward_max": 2.2337500000000006,
        "reward_min": 0.0850000000000005,
        "leartime_s": 0.024736728984862566,
        "sampletime": 7.7231072789873,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 8480000,
        "reward_mean": 0.7581000000000008,
        "reward_max": 1.7718750000000008,
        "reward_min": -0.054374999999999035,
        "leartime_s": 0.020520765014225617,
        "sampletime": 7.753470600990113,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 8500000,
        "reward_mean": 0.8308750000000006,
        "reward_max": 1.883750000000001,
        "reward_min": -0.07812499999999928,
        "leartime_s": 0.02098384700366296,
        "sampletime": 7.560644123004749,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 8520000,
        "reward_mean": 0.8197500000000005,
        "reward_max": 1.7443750000000007,
        "reward_min": -0.2956249999999997,
        "leartime_s": 0.020287972001824528,
        "sampletime": 7.7692726330133155,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 8540000,
        "reward_mean": 0.9070750000000006,
        "reward_max": 1.98875,
        "reward_min": -0.3587499999999996,
        "leartime_s": 0.020721974986372516,
        "sampletime": 7.811721698992187,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 8560000,
        "reward_mean": 1.1880500000000007,
        "reward_max": 1.9937500000000004,
        "reward_min": 0.3575000000000004,
        "leartime_s": 0.03118813200853765,
        "sampletime": 7.8154609960038215,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 8580000,
        "reward_mean": 1.0390000000000006,
        "reward_max": 1.9250000000000005,
        "reward_min": 0.07562500000000079,
        "leartime_s": 0.020564364007441327,
        "sampletime": 7.851768337015528,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 8600000,
        "reward_mean": 0.7475000000000007,
        "reward_max": 2.26125,
        "reward_min": -1.0668749999999991,
        "leartime_s": 0.020352830993942916,
        "sampletime": 7.785748030990362,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 8620000,
        "reward_mean": 1.1176000000000008,
        "reward_max": 2.066875000000001,
        "reward_min": 0.4400000000000008,
        "leartime_s": 0.02061818100628443,
        "sampletime": 7.808360028982861,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 8640000,
        "reward_mean": 1.2225500000000007,
        "reward_max": 2.317500000000001,
        "reward_min": 0.08187500000000061,
        "leartime_s": 0.050560695002786815,
        "sampletime": 7.820811839017551,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 8660000,
        "reward_mean": 0.7994250000000006,
        "reward_max": 1.811875000000001,
        "reward_min": -0.3574999999999993,
        "leartime_s": 0.027213339984882623,
        "sampletime": 7.979983288998483,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 8680000,
        "reward_mean": 0.9065250000000008,
        "reward_max": 1.7993750000000006,
        "reward_min": 0.04937500000000074,
        "leartime_s": 0.021846121991984546,
        "sampletime": 7.848066617996665,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 8700000,
        "reward_mean": 0.9793000000000007,
        "reward_max": 1.8387500000000008,
        "reward_min": 0.27375000000000077,
        "leartime_s": 0.021267640026053414,
        "sampletime": 7.904101367021212,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 8720000,
        "reward_mean": 0.6038500000000008,
        "reward_max": 1.2393750000000006,
        "reward_min": -0.5224999999999994,
        "leartime_s": 0.04539037198992446,
        "sampletime": 7.784833340003388,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 8740000,
        "reward_mean": 0.7343750000000007,
        "reward_max": 1.8537500000000011,
        "reward_min": -0.5218749999999996,
        "leartime_s": 0.023983202001545578,
        "sampletime": 7.864916632999666,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 8760000,
        "reward_mean": 0.9034250000000007,
        "reward_max": 1.863750000000001,
        "reward_min": -0.17499999999999866,
        "leartime_s": 0.02307505498174578,
        "sampletime": 7.85834620098467,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 8780000,
        "reward_mean": 0.5391750000000006,
        "reward_max": 1.5281250000000006,
        "reward_min": -0.8599999999999994,
        "leartime_s": 0.02655097100068815,
        "sampletime": 7.6625838479958475,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 8800000,
        "reward_mean": 0.9221500000000006,
        "reward_max": 1.7618750000000005,
        "reward_min": -0.44312499999999994,
        "leartime_s": 0.03115085998433642,
        "sampletime": 7.768715841986705,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 8820000,
        "reward_mean": 0.9822750000000008,
        "reward_max": 2.1175,
        "reward_min": 0.04500000000000076,
        "leartime_s": 0.03070606300025247,
        "sampletime": 7.841250733996276,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 8840000,
        "reward_mean": 0.7380750000000006,
        "reward_max": 1.8950000000000002,
        "reward_min": -0.4837499999999995,
        "leartime_s": 0.021181558986427262,
        "sampletime": 7.797152862010989,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 8860000,
        "reward_mean": 0.9721750000000008,
        "reward_max": 1.754375000000001,
        "reward_min": -0.059999999999999026,
        "leartime_s": 0.03057199201430194,
        "sampletime": 7.6057224410178605,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 8880000,
        "reward_mean": 0.8192750000000008,
        "reward_max": 1.7831250000000005,
        "reward_min": 0.05437500000000063,
        "leartime_s": 0.03190898700268008,
        "sampletime": 7.8093636379926465,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 8900000,
        "reward_mean": 0.8242500000000006,
        "reward_max": 1.7612500000000009,
        "reward_min": -0.09249999999999942,
        "leartime_s": 0.023071481002261862,
        "sampletime": 7.783253700006753,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 8920000,
        "reward_mean": 0.8536000000000006,
        "reward_max": 1.8637500000000007,
        "reward_min": -0.11937499999999955,
        "leartime_s": 0.02138943801401183,
        "sampletime": 7.763501022011042,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 8940000,
        "reward_mean": 1.0955000000000006,
        "reward_max": 1.8750000000000013,
        "reward_min": 0.2906249999999999,
        "leartime_s": 0.030260903004091233,
        "sampletime": 7.747975631995359,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 8960000,
        "reward_mean": 0.7640000000000005,
        "reward_max": 1.9050000000000007,
        "reward_min": -0.21749999999999942,
        "leartime_s": 0.021376819990109652,
        "sampletime": 7.883290619007312,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 8980000,
        "reward_mean": 1.0784750000000007,
        "reward_max": 2.1043750000000006,
        "reward_min": 0.03437500000000006,
        "leartime_s": 0.021938835008768365,
        "sampletime": 7.689634478010703,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 9000000,
        "reward_mean": 0.7869000000000007,
        "reward_max": 1.9518750000000007,
        "reward_min": -0.2787499999999996,
        "leartime_s": 0.05170121998526156,
        "sampletime": 7.710104991012486,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 9020000,
        "reward_mean": 0.8840750000000007,
        "reward_max": 1.7850000000000004,
        "reward_min": -0.4724999999999988,
        "leartime_s": 0.021080348000396043,
        "sampletime": 7.858930958987912,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 9040000,
        "reward_mean": 0.8863750000000006,
        "reward_max": 2.2437500000000004,
        "reward_min": -0.21874999999999992,
        "leartime_s": 0.02288599099847488,
        "sampletime": 7.7047147230186965,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 9060000,
        "reward_mean": 0.7705750000000006,
        "reward_max": 2.075,
        "reward_min": -1.4206249999999991,
        "leartime_s": 0.03616595800849609,
        "sampletime": 7.761944272002438,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 9080000,
        "reward_mean": 1.0480500000000006,
        "reward_max": 2.035625000000001,
        "reward_min": 0.05562500000000106,
        "leartime_s": 0.021544910996453837,
        "sampletime": 7.736092690000078,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 9100000,
        "reward_mean": 0.6327500000000005,
        "reward_max": 2.036875,
        "reward_min": -0.4481249999999999,
        "leartime_s": 0.04097684100270271,
        "sampletime": 7.818525917013176,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 9120000,
        "reward_mean": 0.5992000000000005,
        "reward_max": 1.6556250000000008,
        "reward_min": -0.49312500000000026,
        "leartime_s": 0.034219790977658704,
        "sampletime": 7.773819993977668,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 9140000,
        "reward_mean": 0.7198500000000005,
        "reward_max": 1.8650000000000007,
        "reward_min": -0.3418749999999997,
        "leartime_s": 0.025003899994771928,
        "sampletime": 7.706908504012972,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 9160000,
        "reward_mean": 1.0852750000000009,
        "reward_max": 2.196875000000001,
        "reward_min": -0.010624999999999898,
        "leartime_s": 0.0451732010114938,
        "sampletime": 7.814137459004996,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 9180000,
        "reward_mean": 0.9628750000000006,
        "reward_max": 2.20375,
        "reward_min": -0.3462499999999999,
        "leartime_s": 0.022034432011423633,
        "sampletime": 7.783895194996148,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 9200000,
        "reward_mean": 1.0449250000000008,
        "reward_max": 2.0493750000000013,
        "reward_min": 0.1356250000000005,
        "leartime_s": 0.03511870899819769,
        "sampletime": 7.846533688978525,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 9220000,
        "reward_mean": 0.4830000000000006,
        "reward_max": 1.456875000000001,
        "reward_min": -0.656249999999999,
        "leartime_s": 0.03906895298860036,
        "sampletime": 7.826824254996609,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 9240000,
        "reward_mean": 0.8790500000000006,
        "reward_max": 1.9162500000000007,
        "reward_min": -0.060624999999999846,
        "leartime_s": 0.04774996198830195,
        "sampletime": 7.803152096981648,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 9260000,
        "reward_mean": 0.7189750000000006,
        "reward_max": 2.036875,
        "reward_min": -0.46874999999999967,
        "leartime_s": 0.02475392399355769,
        "sampletime": 7.789459778025048,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 9280000,
        "reward_mean": 1.0240750000000007,
        "reward_max": 2.1831250000000013,
        "reward_min": -0.97875,
        "leartime_s": 0.04099475700058974,
        "sampletime": 7.8582212979963515,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 9300000,
        "reward_mean": 0.9485250000000005,
        "reward_max": 1.903125000000001,
        "reward_min": -0.29375,
        "leartime_s": 0.02407250800752081,
        "sampletime": 7.862446357001318,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 9320000,
        "reward_mean": 0.8706250000000006,
        "reward_max": 1.9112500000000003,
        "reward_min": -0.14062499999999947,
        "leartime_s": 0.025838367000687867,
        "sampletime": 7.87393175100442,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 9340000,
        "reward_mean": 1.0374500000000006,
        "reward_max": 1.9362500000000005,
        "reward_min": 0.06062499999999987,
        "leartime_s": 0.025109686015639454,
        "sampletime": 7.755978258996038,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 9360000,
        "reward_mean": 0.9307836666666672,
        "reward_max": 2.1250000000000004,
        "reward_min": -0.5431249999999994,
        "leartime_s": 0.023785999976098537,
        "sampletime": 7.8796981269842945,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 9380000,
        "reward_mean": 1.0479250000000004,
        "reward_max": 2.0350000000000006,
        "reward_min": -0.07375000000000012,
        "leartime_s": 0.02475658099865541,
        "sampletime": 7.662647311983164,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 9400000,
        "reward_mean": 1.2283750000000007,
        "reward_max": 2.215625000000001,
        "reward_min": 0.4375000000000007,
        "leartime_s": 0.02391193000948988,
        "sampletime": 7.770447234011954,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 9420000,
        "reward_mean": 0.6577750000000007,
        "reward_max": 1.6456250000000008,
        "reward_min": -0.5562499999999995,
        "leartime_s": 0.0317453530151397,
        "sampletime": 7.7207753410039,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 9440000,
        "reward_mean": 0.9980000000000007,
        "reward_max": 1.7275000000000005,
        "reward_min": -0.4893749999999992,
        "leartime_s": 0.047707209014333785,
        "sampletime": 7.771313714009011,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 9460000,
        "reward_mean": 0.6804500000000006,
        "reward_max": 2.035,
        "reward_min": -0.2668749999999997,
        "leartime_s": 0.022294254013104364,
        "sampletime": 7.769337252015248,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 9480000,
        "reward_mean": 1.0540250000000007,
        "reward_max": 2.1187500000000004,
        "reward_min": -0.11937499999999944,
        "leartime_s": 0.024381361989071593,
        "sampletime": 7.9258155029965565,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 9500000,
        "reward_mean": 0.8334750000000006,
        "reward_max": 2.0587500000000007,
        "reward_min": -0.2906249999999997,
        "leartime_s": 0.032063428981928155,
        "sampletime": 7.797012274997542,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 9520000,
        "reward_mean": 0.9291250000000006,
        "reward_max": 2.3731250000000004,
        "reward_min": -0.4568749999999992,
        "leartime_s": 0.05734748998656869,
        "sampletime": 7.729247112001758,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 9540000,
        "reward_mean": 0.8429000000000006,
        "reward_max": 1.9181250000000007,
        "reward_min": -0.4912499999999996,
        "leartime_s": 0.04765463600051589,
        "sampletime": 7.723125746008009,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 9560000,
        "reward_mean": 0.9235000000000007,
        "reward_max": 2.255625,
        "reward_min": -0.14999999999999972,
        "leartime_s": 0.029867906996514648,
        "sampletime": 7.867359789001057,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 9580000,
        "reward_mean": 0.7014250000000006,
        "reward_max": 1.8512500000000003,
        "reward_min": -0.8493749999999995,
        "leartime_s": 0.022417239990318194,
        "sampletime": 7.932739522017073,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 9600000,
        "reward_mean": 1.1798500000000007,
        "reward_max": 2.2893749999999997,
        "reward_min": 0.32062500000000094,
        "leartime_s": 0.022911759006092325,
        "sampletime": 7.660384696006076,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 9620000,
        "reward_mean": 0.8746500000000006,
        "reward_max": 2.1706250000000007,
        "reward_min": -0.4099999999999999,
        "leartime_s": 0.053151533997152,
        "sampletime": 7.830396743025631,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 9640000,
        "reward_mean": 1.2974250000000007,
        "reward_max": 2.3481250000000005,
        "reward_min": -0.049999999999999434,
        "leartime_s": 0.02423183200880885,
        "sampletime": 7.591127027000766,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 9660000,
        "reward_mean": 0.9805000000000006,
        "reward_max": 2.1718750000000004,
        "reward_min": -0.05624999999999976,
        "leartime_s": 0.04838530198321678,
        "sampletime": 7.7995966610033065,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 9680000,
        "reward_mean": 1.1244500000000008,
        "reward_max": 2.3500000000000005,
        "reward_min": -0.5312500000000002,
        "leartime_s": 0.024983095994684845,
        "sampletime": 7.7721620830125175,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 9700000,
        "reward_mean": 1.1863750000000006,
        "reward_max": 2.2168750000000004,
        "reward_min": -0.0762499999999997,
        "leartime_s": 0.0411814019898884,
        "sampletime": 7.615621141972952,
        "best_mean": 1.4016250000000008,
        "best_max": 2.423750000000001,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 9720000,
        "reward_mean": 1.5042750000000005,
        "reward_max": 2.6100000000000003,
        "reward_min": 0.5756250000000005,
        "leartime_s": 0.04076455798349343,
        "sampletime": 7.591667946981033,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 9740000,
        "reward_mean": 1.2004250000000007,
        "reward_max": 2.2937499999999993,
        "reward_min": 0.1750000000000006,
        "leartime_s": 0.04937270100344904,
        "sampletime": 7.5405964459932875,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 9760000,
        "reward_mean": 0.9729250000000004,
        "reward_max": 1.9962500000000005,
        "reward_min": -0.29125,
        "leartime_s": 0.022453840996604413,
        "sampletime": 7.6261319880140945,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 9780000,
        "reward_mean": 0.9791000000000005,
        "reward_max": 2.2925,
        "reward_min": -0.375625,
        "leartime_s": 0.023406518012052402,
        "sampletime": 7.5694927090080455,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 9800000,
        "reward_mean": 1.1813250000000006,
        "reward_max": 2.3662500000000004,
        "reward_min": 0.009375000000000827,
        "leartime_s": 0.06563556002220139,
        "sampletime": 7.641174507007236,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 9820000,
        "reward_mean": 0.7893500000000006,
        "reward_max": 1.761875,
        "reward_min": -0.41124999999999967,
        "leartime_s": 0.022648485988611355,
        "sampletime": 7.714681729994481,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 9840000,
        "reward_mean": 1.0924750000000005,
        "reward_max": 2.4256250000000006,
        "reward_min": -0.19312499999999924,
        "leartime_s": 0.06153723000898026,
        "sampletime": 7.906413613993209,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 9860000,
        "reward_mean": 1.3549500000000008,
        "reward_max": 2.7562499999999996,
        "reward_min": 0.2050000000000004,
        "leartime_s": 0.045244181994348764,
        "sampletime": 7.6851676179794595,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 9880000,
        "reward_mean": 1.2064750000000009,
        "reward_max": 2.5325000000000006,
        "reward_min": 0.28625000000000045,
        "leartime_s": 0.023191070009488612,
        "sampletime": 7.722928645991487,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 9900000,
        "reward_mean": 1.1076750000000006,
        "reward_max": 2.4781250000000004,
        "reward_min": 0.1750000000000002,
        "leartime_s": 0.034057295008096844,
        "sampletime": 7.6219819220132194,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 9920000,
        "reward_mean": 1.0751500000000005,
        "reward_max": 2.0400000000000005,
        "reward_min": -0.18812499999999985,
        "leartime_s": 0.03488051498425193,
        "sampletime": 7.6200802979874425,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 9940000,
        "reward_mean": 1.0238250000000007,
        "reward_max": 2.105625,
        "reward_min": -0.6012499999999993,
        "leartime_s": 0.03286454200861044,
        "sampletime": 7.732725067005958,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 9960000,
        "reward_mean": 1.0257500000000004,
        "reward_max": 2.2600000000000002,
        "reward_min": -0.1493749999999987,
        "leartime_s": 0.023183018987765536,
        "sampletime": 7.78407474301639,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 9980000,
        "reward_mean": 1.1890000000000007,
        "reward_max": 2.288125000000001,
        "reward_min": -0.10749999999999979,
        "leartime_s": 0.03210809797747061,
        "sampletime": 7.882718163979007,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 10000000,
        "reward_mean": 1.1610500000000006,
        "reward_max": 2.4625000000000004,
        "reward_min": 0.05000000000000043,
        "leartime_s": 0.049500296998303384,
        "sampletime": 7.8344743470079266,
        "best_mean": 1.5042750000000005,
        "best_max": 2.6100000000000003,
        "params": {
            "agentsize": 10,
            "yellow": 0,
            "seeds": 45685,
            "it": 500,
            "envs": 10,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]