[
    {
        "generation": 1,
        "timesteps": 2000,
        "reward_mean": -39.088950000000004,
        "reward_max": -0.698687499999999,
        "reward_min": -87.39881249999999,
        "leartime_s": 0.020976163999876007,
        "sampletime": 1.6032069920038339,
        "best_mean": -39.088950000000004,
        "best_max": -0.698687499999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 4000,
        "reward_mean": -35.74145,
        "reward_max": -3.0964999999999994,
        "reward_min": -196.67275000000004,
        "leartime_s": 0.017368516011629254,
        "sampletime": 2.089371458016103,
        "best_mean": -35.74145,
        "best_max": -3.0964999999999994,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 6000,
        "reward_mean": -19.78405,
        "reward_max": 1.3571875000000002,
        "reward_min": -73.15506250000001,
        "leartime_s": 0.04785531500237994,
        "sampletime": 1.7116222259937786,
        "best_mean": -19.78405,
        "best_max": 1.3571875000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 8000,
        "reward_mean": -18.704925000000003,
        "reward_max": 0.872625,
        "reward_min": -64.19118750000001,
        "leartime_s": 0.014731514995219186,
        "sampletime": 1.9695387190149631,
        "best_mean": -18.704925000000003,
        "best_max": 0.872625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 10000,
        "reward_mean": -18.22565,
        "reward_max": 1.7780000000000002,
        "reward_min": -42.2629375,
        "leartime_s": 0.020190737006487325,
        "sampletime": 2.2084806480270345,
        "best_mean": -18.22565,
        "best_max": 1.7780000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 12000,
        "reward_mean": -18.584774999999997,
        "reward_max": -0.8142500000000003,
        "reward_min": -58.99474999999998,
        "leartime_s": 0.005231520015513524,
        "sampletime": 1.654121005005436,
        "best_mean": -18.22565,
        "best_max": 1.7780000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 14000,
        "reward_mean": -15.794974999999999,
        "reward_max": -4.683562500000001,
        "reward_min": -122.9134375,
        "leartime_s": 0.020126837014686316,
        "sampletime": 2.1428169120044913,
        "best_mean": -15.794974999999999,
        "best_max": -4.683562500000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 16000,
        "reward_mean": -11.560475,
        "reward_max": -5.325499999999998,
        "reward_min": -53.33449999999999,
        "leartime_s": 0.01491952600190416,
        "sampletime": 2.15557514198008,
        "best_mean": -11.560475,
        "best_max": -5.325499999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 18000,
        "reward_mean": -8.987125,
        "reward_max": -3.3546250000000004,
        "reward_min": -26.0131875,
        "leartime_s": 0.03113411198137328,
        "sampletime": 2.0681768970098346,
        "best_mean": -8.987125,
        "best_max": -3.3546250000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 20000,
        "reward_mean": -5.797350000000001,
        "reward_max": -2.0232499999999995,
        "reward_min": -20.872750000000003,
        "leartime_s": 0.02924726699711755,
        "sampletime": 2.0042885500006378,
        "best_mean": -5.797350000000001,
        "best_max": -2.0232499999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 22000,
        "reward_mean": -3.2169250000000003,
        "reward_max": -0.9981874999999997,
        "reward_min": -10.9943125,
        "leartime_s": 0.016050084988819435,
        "sampletime": 1.9479341160040349,
        "best_mean": -3.2169250000000003,
        "best_max": -0.9981874999999997,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 24000,
        "reward_mean": -2.4077750000000004,
        "reward_max": -0.2436875000000001,
        "reward_min": -5.047437500000002,
        "leartime_s": 0.014228401007130742,
        "sampletime": 1.8841923949948978,
        "best_mean": -2.4077750000000004,
        "best_max": -0.2436875000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 26000,
        "reward_mean": -2.58015,
        "reward_max": -1.0833124999999997,
        "reward_min": -4.705687500000001,
        "leartime_s": 0.00700829501147382,
        "sampletime": 1.7451793889922556,
        "best_mean": -2.4077750000000004,
        "best_max": -0.2436875000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 28000,
        "reward_mean": -2.403,
        "reward_max": -1.0036875000000003,
        "reward_min": -4.2521249999999995,
        "leartime_s": 0.021277634979924187,
        "sampletime": 2.038514292013133,
        "best_mean": -2.403,
        "best_max": -1.0036875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 30000,
        "reward_mean": -2.2492499999999995,
        "reward_max": -0.7423749999999995,
        "reward_min": -3.8797499999999996,
        "leartime_s": 0.018132530996808782,
        "sampletime": 2.070713941997383,
        "best_mean": -2.2492499999999995,
        "best_max": -0.7423749999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 32000,
        "reward_mean": -2.14165,
        "reward_max": -0.9445624999999997,
        "reward_min": -3.8195624999999995,
        "leartime_s": 0.02048138898680918,
        "sampletime": 1.7604784189898055,
        "best_mean": -2.14165,
        "best_max": -0.9445624999999997,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 34000,
        "reward_mean": -1.7785499999999996,
        "reward_max": -0.7994999999999997,
        "reward_min": -3.37775,
        "leartime_s": 0.01652914800797589,
        "sampletime": 1.8230278749833815,
        "best_mean": -1.7785499999999996,
        "best_max": -0.7994999999999997,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 36000,
        "reward_mean": -2.0860999999999996,
        "reward_max": -0.6564999999999993,
        "reward_min": -3.7663749999999987,
        "leartime_s": 0.018818907003151253,
        "sampletime": 2.112603854009649,
        "best_mean": -1.7785499999999996,
        "best_max": -0.7994999999999997,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 38000,
        "reward_mean": -1.7821,
        "reward_max": -0.8577500000000001,
        "reward_min": -3.2688749999999995,
        "leartime_s": 0.017723378026857972,
        "sampletime": 1.8639609630045015,
        "best_mean": -1.7785499999999996,
        "best_max": -0.7994999999999997,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 40000,
        "reward_mean": -1.5522,
        "reward_max": -0.5639999999999996,
        "reward_min": -2.673875,
        "leartime_s": 0.05014413097524084,
        "sampletime": 1.9198084880190436,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 42000,
        "reward_mean": -1.6347749999999999,
        "reward_max": -0.8063749999999997,
        "reward_min": -2.609625,
        "leartime_s": 0.019703013997059315,
        "sampletime": 2.320447455975227,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 44000,
        "reward_mean": -1.8794,
        "reward_max": -0.8073125000000001,
        "reward_min": -3.2396875000000005,
        "leartime_s": 0.014928156015230343,
        "sampletime": 1.7104351200105157,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 46000,
        "reward_mean": -1.9031999999999998,
        "reward_max": -1.007875,
        "reward_min": -3.2403750000000002,
        "leartime_s": 0.015276963007636368,
        "sampletime": 2.304300935997162,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 48000,
        "reward_mean": -1.7928999999999997,
        "reward_max": -0.5904374999999997,
        "reward_min": -3.3491874999999998,
        "leartime_s": 0.006193887995323166,
        "sampletime": 1.8539004269987345,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 50000,
        "reward_mean": -1.6703749999999997,
        "reward_max": -0.35143750000000007,
        "reward_min": -2.8906874999999985,
        "leartime_s": 0.0053931319853290915,
        "sampletime": 1.839054935000604,
        "best_mean": -1.5522,
        "best_max": -0.5639999999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 52000,
        "reward_mean": -1.5268249999999999,
        "reward_max": -0.7076874999999999,
        "reward_min": -2.8219374999999984,
        "leartime_s": 0.005991137004457414,
        "sampletime": 2.150019579974469,
        "best_mean": -1.5268249999999999,
        "best_max": -0.7076874999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 54000,
        "reward_mean": -1.5024999999999997,
        "reward_max": -0.3962499999999996,
        "reward_min": -2.8975624999999994,
        "leartime_s": 0.011267127993050963,
        "sampletime": 1.8989730079774745,
        "best_mean": -1.5024999999999997,
        "best_max": -0.3962499999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 56000,
        "reward_mean": -1.33,
        "reward_max": -0.4481249999999999,
        "reward_min": -2.5388125,
        "leartime_s": 0.011531698983162642,
        "sampletime": 1.956767861993285,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 58000,
        "reward_mean": -1.3863999999999999,
        "reward_max": -0.38606249999999986,
        "reward_min": -2.8993124999999993,
        "leartime_s": 0.010239589988486841,
        "sampletime": 1.8318650099972729,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 60000,
        "reward_mean": -1.6720249999999997,
        "reward_max": -0.7696874999999999,
        "reward_min": -3.0515624999999993,
        "leartime_s": 0.005909435974899679,
        "sampletime": 1.8470248540106695,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 62000,
        "reward_mean": -1.60635,
        "reward_max": -0.6859999999999999,
        "reward_min": -3.141125,
        "leartime_s": 0.005994125996949151,
        "sampletime": 1.6746181570051704,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 64000,
        "reward_mean": -1.703375,
        "reward_max": -0.6457499999999999,
        "reward_min": -3.0346875,
        "leartime_s": 0.051025416993070394,
        "sampletime": 1.969620126998052,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 66000,
        "reward_mean": -1.6098184500000001,
        "reward_max": -0.7247499999999999,
        "reward_min": -2.7978125000000005,
        "leartime_s": 0.03036579699255526,
        "sampletime": 1.7398172040120699,
        "best_mean": -1.33,
        "best_max": -0.4481249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 68000,
        "reward_mean": -1.284,
        "reward_max": -0.26268749999999996,
        "reward_min": -2.5714375,
        "leartime_s": 0.017282224987866357,
        "sampletime": 1.94714499800466,
        "best_mean": -1.284,
        "best_max": -0.26268749999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 70000,
        "reward_mean": -1.689175,
        "reward_max": -0.7149375,
        "reward_min": -2.9536249999999997,
        "leartime_s": 0.02292733799549751,
        "sampletime": 1.9252788980084006,
        "best_mean": -1.284,
        "best_max": -0.26268749999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 72000,
        "reward_mean": -1.4520750000000002,
        "reward_max": -0.5456250000000001,
        "reward_min": -2.6055,
        "leartime_s": 0.0073165470093954355,
        "sampletime": 2.098001017002389,
        "best_mean": -1.284,
        "best_max": -0.26268749999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 74000,
        "reward_mean": -1.4170750000000003,
        "reward_max": -0.6037499999999999,
        "reward_min": -2.697250000000001,
        "leartime_s": 0.017238173983059824,
        "sampletime": 1.957886410993524,
        "best_mean": -1.284,
        "best_max": -0.26268749999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 76000,
        "reward_mean": -1.349925,
        "reward_max": -0.39799999999999985,
        "reward_min": -2.4244375000000002,
        "leartime_s": 0.019528553006239235,
        "sampletime": 1.8304698249849025,
        "best_mean": -1.284,
        "best_max": -0.26268749999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 78000,
        "reward_mean": -1.274025,
        "reward_max": -0.33806249999999993,
        "reward_min": -2.1530625000000003,
        "leartime_s": 0.011319307988742366,
        "sampletime": 1.9466840499953832,
        "best_mean": -1.274025,
        "best_max": -0.33806249999999993,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 80000,
        "reward_mean": -1.5971750000000002,
        "reward_max": -0.47174999999999984,
        "reward_min": -2.8068125,
        "leartime_s": 0.008848499011946842,
        "sampletime": 1.9120975510159042,
        "best_mean": -1.274025,
        "best_max": -0.33806249999999993,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 82000,
        "reward_mean": -1.8136999999999999,
        "reward_max": -0.9531250000000003,
        "reward_min": -2.9968750000000006,
        "leartime_s": 0.017077113006962463,
        "sampletime": 2.1198014320107177,
        "best_mean": -1.274025,
        "best_max": -0.33806249999999993,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 84000,
        "reward_mean": -1.363975,
        "reward_max": -0.46799999999999997,
        "reward_min": -2.6274999999999995,
        "leartime_s": 0.019487091019982472,
        "sampletime": 2.2623765210155398,
        "best_mean": -1.274025,
        "best_max": -0.33806249999999993,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 86000,
        "reward_mean": -1.26865,
        "reward_max": -0.4120625,
        "reward_min": -2.4394374999999995,
        "leartime_s": 0.017000653024297208,
        "sampletime": 1.8153686030127574,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 88000,
        "reward_mean": -1.52755,
        "reward_max": -0.31368749999999995,
        "reward_min": -2.4826249999999996,
        "leartime_s": 0.01217951497528702,
        "sampletime": 2.235061974992277,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 90000,
        "reward_mean": -1.4319500000000003,
        "reward_max": -0.5052500000000001,
        "reward_min": -2.4813125,
        "leartime_s": 0.008468535990687087,
        "sampletime": 1.8316623299906496,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 92000,
        "reward_mean": -1.3060999999999998,
        "reward_max": -0.33756249999999993,
        "reward_min": -2.4422500000000005,
        "leartime_s": 0.02308350001112558,
        "sampletime": 2.110083751991624,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 94000,
        "reward_mean": -1.455175,
        "reward_max": -0.5036250000000004,
        "reward_min": -2.4813750000000003,
        "leartime_s": 0.007897140982095152,
        "sampletime": 1.9707988940062933,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 96000,
        "reward_mean": -1.4869500000000002,
        "reward_max": -0.5755,
        "reward_min": -2.6463750000000004,
        "leartime_s": 0.03206983901327476,
        "sampletime": 1.9518039060058072,
        "best_mean": -1.26865,
        "best_max": -0.4120625,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 98000,
        "reward_mean": -1.157475,
        "reward_max": -0.2363124999999999,
        "reward_min": -2.3101875,
        "leartime_s": 0.0385022189875599,
        "sampletime": 2.143193196010543,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 100000,
        "reward_mean": -1.3460999999999999,
        "reward_max": -0.4633749999999998,
        "reward_min": -2.3551875,
        "leartime_s": 0.013513474987121299,
        "sampletime": 1.6853729269932956,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 102000,
        "reward_mean": -1.4577250000000002,
        "reward_max": -0.6761249999999999,
        "reward_min": -2.5755,
        "leartime_s": 0.018787776003591716,
        "sampletime": 1.6966623910120688,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 104000,
        "reward_mean": -1.3945500000000002,
        "reward_max": -0.5215,
        "reward_min": -2.530937500000001,
        "leartime_s": 0.009499963984126225,
        "sampletime": 2.0277828719990794,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 106000,
        "reward_mean": -1.3296000000000003,
        "reward_max": -0.47081250000000024,
        "reward_min": -2.3767500000000013,
        "leartime_s": 0.03370175702730194,
        "sampletime": 2.124352613987867,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 108000,
        "reward_mean": -1.5735500000000002,
        "reward_max": -0.6510000000000002,
        "reward_min": -2.7731875,
        "leartime_s": 0.02159209901583381,
        "sampletime": 1.966511170990998,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 110000,
        "reward_mean": -1.3963500000000004,
        "reward_max": -0.17712499999999998,
        "reward_min": -2.4803125,
        "leartime_s": 0.005454202007967979,
        "sampletime": 1.9570833120087627,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 112000,
        "reward_mean": -1.2736750000000003,
        "reward_max": -0.29731250000000015,
        "reward_min": -2.611562500000001,
        "leartime_s": 0.006512411026051268,
        "sampletime": 2.0161857880011667,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 114000,
        "reward_mean": -1.1967250000000003,
        "reward_max": -0.39206249999999976,
        "reward_min": -2.5948750000000005,
        "leartime_s": 0.030226845003198832,
        "sampletime": 1.7257304369995836,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 116000,
        "reward_mean": -1.2567250000000003,
        "reward_max": -0.19962500000000002,
        "reward_min": -2.3957500000000005,
        "leartime_s": 0.0068252730125095695,
        "sampletime": 2.1472174990049098,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 118000,
        "reward_mean": -1.3811,
        "reward_max": -0.22143749999999984,
        "reward_min": -2.53775,
        "leartime_s": 0.007110007980372757,
        "sampletime": 2.0617230189964175,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 120000,
        "reward_mean": -1.5370250000000003,
        "reward_max": -0.5941250000000002,
        "reward_min": -2.6756875000000004,
        "leartime_s": 0.06128391099628061,
        "sampletime": 1.9306745780049823,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 122000,
        "reward_mean": -1.37245,
        "reward_max": -0.08406249999999992,
        "reward_min": -2.5883125000000002,
        "leartime_s": 0.010242079995805398,
        "sampletime": 2.1537583080062177,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 124000,
        "reward_mean": -1.360675,
        "reward_max": -0.2426249999999999,
        "reward_min": -3.0006875000000006,
        "leartime_s": 0.020755652018124238,
        "sampletime": 1.68227858399041,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 126000,
        "reward_mean": -1.3806000000000003,
        "reward_max": -0.5760625000000001,
        "reward_min": -2.5450000000000004,
        "leartime_s": 0.03202342998702079,
        "sampletime": 2.012655185011681,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 128000,
        "reward_mean": -1.3019,
        "reward_max": -0.3894375000000002,
        "reward_min": -2.408187499999999,
        "leartime_s": 0.02785873698303476,
        "sampletime": 1.8204768499999773,
        "best_mean": -1.157475,
        "best_max": -0.2363124999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 130000,
        "reward_mean": -1.0836750000000002,
        "reward_max": -0.2096249999999999,
        "reward_min": -1.9812499999999997,
        "leartime_s": 0.02507931599393487,
        "sampletime": 2.06064179900568,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 132000,
        "reward_mean": -1.2917000000000003,
        "reward_max": -0.456375,
        "reward_min": -2.338562500000001,
        "leartime_s": 0.008661806990858167,
        "sampletime": 2.0764847889950033,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 134000,
        "reward_mean": -1.3923500000000002,
        "reward_max": -0.4231875000000001,
        "reward_min": -2.6173125000000006,
        "leartime_s": 0.02671153799747117,
        "sampletime": 1.817121614003554,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 136000,
        "reward_mean": -1.2745000000000004,
        "reward_max": -0.2980625000000001,
        "reward_min": -2.3269375000000005,
        "leartime_s": 0.022541184996953234,
        "sampletime": 1.6565622999914922,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 138000,
        "reward_mean": -1.4674500000000004,
        "reward_max": -0.5484375000000001,
        "reward_min": -2.487625,
        "leartime_s": 0.03825837801559828,
        "sampletime": 1.8374207070155535,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 140000,
        "reward_mean": -1.4649000000000005,
        "reward_max": -0.6591875,
        "reward_min": -2.507875000000001,
        "leartime_s": 0.007305667008040473,
        "sampletime": 1.9351030580000952,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 142000,
        "reward_mean": -1.2242250000000003,
        "reward_max": -0.3555000000000001,
        "reward_min": -2.2795000000000005,
        "leartime_s": 0.021865190006792545,
        "sampletime": 1.9388720570132136,
        "best_mean": -1.0836750000000002,
        "best_max": -0.2096249999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 144000,
        "reward_mean": -0.92945,
        "reward_max": -0.11974999999999998,
        "reward_min": -2.08225,
        "leartime_s": 0.007954332017106935,
        "sampletime": 1.9380514459917322,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 146000,
        "reward_mean": -1.1691,
        "reward_max": -0.32274999999999987,
        "reward_min": -2.28675,
        "leartime_s": 0.021293906000209972,
        "sampletime": 1.90531595601351,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 148000,
        "reward_mean": -1.4031250000000004,
        "reward_max": -0.43549999999999994,
        "reward_min": -2.6216250000000008,
        "leartime_s": 0.01783361900015734,
        "sampletime": 1.7849310740130022,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 150000,
        "reward_mean": -1.1912250000000004,
        "reward_max": -0.20918750000000014,
        "reward_min": -2.589562500000001,
        "leartime_s": 0.0166337100090459,
        "sampletime": 1.9588406079856213,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 152000,
        "reward_mean": -1.0965750000000003,
        "reward_max": -0.04431249999999992,
        "reward_min": -2.471875000000001,
        "leartime_s": 0.020674280996900052,
        "sampletime": 1.785619646019768,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 154000,
        "reward_mean": -1.0280250000000002,
        "reward_max": -0.08881249999999999,
        "reward_min": -2.147812500000001,
        "leartime_s": 0.01720276300329715,
        "sampletime": 2.0980234119924717,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 156000,
        "reward_mean": -1.3296750000000002,
        "reward_max": -0.4500625000000002,
        "reward_min": -2.2880000000000003,
        "leartime_s": 0.012986000976525247,
        "sampletime": 1.9562680580129381,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 158000,
        "reward_mean": -1.0197250000000002,
        "reward_max": -0.1449999999999999,
        "reward_min": -2.1338125000000003,
        "leartime_s": 0.0091233309940435,
        "sampletime": 1.9609827650128864,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 160000,
        "reward_mean": -1.1638500000000003,
        "reward_max": -0.013687500000000033,
        "reward_min": -2.3109375,
        "leartime_s": 0.007855831005144864,
        "sampletime": 1.9315953820187133,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 162000,
        "reward_mean": -1.2241000000000004,
        "reward_max": -0.357625,
        "reward_min": -2.1690625000000003,
        "leartime_s": 0.029364068992435932,
        "sampletime": 1.8376597899768967,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 164000,
        "reward_mean": -0.9501500000000003,
        "reward_max": -0.22481250000000005,
        "reward_min": -1.9863750000000002,
        "leartime_s": 0.08823050701175816,
        "sampletime": 1.803013071010355,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 166000,
        "reward_mean": -1.2884500000000003,
        "reward_max": -0.40393749999999984,
        "reward_min": -2.2828125000000004,
        "leartime_s": 0.006245449010748416,
        "sampletime": 1.714997545001097,
        "best_mean": -0.92945,
        "best_max": -0.11974999999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 168000,
        "reward_mean": -0.8937000000000003,
        "reward_max": 0.1359375000000002,
        "reward_min": -1.9342500000000007,
        "leartime_s": 0.008448535983916372,
        "sampletime": 1.9992214080120903,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 170000,
        "reward_mean": -1.2153500000000002,
        "reward_max": -0.39162500000000044,
        "reward_min": -2.686875,
        "leartime_s": 0.016897581983357668,
        "sampletime": 1.7992176009865943,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 172000,
        "reward_mean": -1.1224500000000002,
        "reward_max": -0.15768749999999965,
        "reward_min": -2.238125,
        "leartime_s": 0.011977223010035232,
        "sampletime": 1.9970922869979404,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 174000,
        "reward_mean": -1.1228500000000003,
        "reward_max": -0.29637499999999994,
        "reward_min": -2.4893750000000003,
        "leartime_s": 0.01503129699267447,
        "sampletime": 1.9727870729984716,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 176000,
        "reward_mean": -0.9778000000000003,
        "reward_max": 0.039562500000000125,
        "reward_min": -2.158312500000001,
        "leartime_s": 0.028147409000666812,
        "sampletime": 1.7665223719959613,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 178000,
        "reward_mean": -0.9030250000000003,
        "reward_max": 0.22387500000000013,
        "reward_min": -2.1226250000000007,
        "leartime_s": 0.029375598998740315,
        "sampletime": 2.108484144002432,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 180000,
        "reward_mean": -1.1362750000000004,
        "reward_max": -0.31668749999999984,
        "reward_min": -2.3963125000000005,
        "leartime_s": 0.01655237900558859,
        "sampletime": 2.160352114995476,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 182000,
        "reward_mean": -1.1763000000000003,
        "reward_max": -0.21437499999999995,
        "reward_min": -2.3044375000000006,
        "leartime_s": 0.03216506898752414,
        "sampletime": 1.9910131999931764,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 184000,
        "reward_mean": -1.0392250000000003,
        "reward_max": -0.07831250000000012,
        "reward_min": -2.0218125000000002,
        "leartime_s": 0.009086550999199972,
        "sampletime": 2.264034959982382,
        "best_mean": -0.8937000000000003,
        "best_max": 0.1359375000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 186000,
        "reward_mean": -0.7863250000000002,
        "reward_max": 0.21018750000000025,
        "reward_min": -2.066062500000001,
        "leartime_s": 0.015762642986373976,
        "sampletime": 1.7589103530044667,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 188000,
        "reward_mean": -1.1064750000000003,
        "reward_max": -0.14918749999999992,
        "reward_min": -2.232,
        "leartime_s": 0.05956368401530199,
        "sampletime": 1.9840022410207894,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 190000,
        "reward_mean": -1.1009500000000003,
        "reward_max": -0.12318749999999998,
        "reward_min": -2.1464374999999998,
        "leartime_s": 0.03893953299848363,
        "sampletime": 2.0534710209758487,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 192000,
        "reward_mean": -0.8537750000000002,
        "reward_max": 0.1637500000000001,
        "reward_min": -2.454500000000001,
        "leartime_s": 0.020683531009126455,
        "sampletime": 1.9054823000042234,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 194000,
        "reward_mean": -0.9668500000000002,
        "reward_max": 0.06918750000000001,
        "reward_min": -2.436875000000001,
        "leartime_s": 0.03370503199403174,
        "sampletime": 2.0424375220027287,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 196000,
        "reward_mean": -1.1735500000000003,
        "reward_max": -0.16456250000000006,
        "reward_min": -2.2465000000000006,
        "leartime_s": 0.008672526979353279,
        "sampletime": 2.103344190021744,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 198000,
        "reward_mean": -1.2050250000000002,
        "reward_max": -0.33293750000000005,
        "reward_min": -2.519625000000001,
        "leartime_s": 0.03936100599821657,
        "sampletime": 1.7927997479855549,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 200000,
        "reward_mean": -0.9765250000000002,
        "reward_max": 0.061687500000000096,
        "reward_min": -2.2603750000000007,
        "leartime_s": 0.019787894998444244,
        "sampletime": 1.7003948130004574,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 202000,
        "reward_mean": -1.0567750000000002,
        "reward_max": -0.12231250000000023,
        "reward_min": -2.2028125000000007,
        "leartime_s": 0.023305510985665023,
        "sampletime": 2.077651795989368,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 204000,
        "reward_mean": -1.0110750000000002,
        "reward_max": -0.2041874999999999,
        "reward_min": -2.3479375000000005,
        "leartime_s": 0.028267560002859682,
        "sampletime": 1.8536648610024713,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 206000,
        "reward_mean": -0.9590500000000003,
        "reward_max": -0.23031249999999992,
        "reward_min": -1.9621250000000006,
        "leartime_s": 0.008197434013709426,
        "sampletime": 2.0464408429979812,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 208000,
        "reward_mean": -0.9423750000000002,
        "reward_max": -0.03437499999999985,
        "reward_min": -2.1924375000000005,
        "leartime_s": 0.026680876995669678,
        "sampletime": 1.9115235630015377,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 210000,
        "reward_mean": -0.9476250000000003,
        "reward_max": 0.16537500000000038,
        "reward_min": -1.8145625,
        "leartime_s": 0.0216753380082082,
        "sampletime": 1.9389364620146807,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 212000,
        "reward_mean": -1.1269000000000002,
        "reward_max": -0.2709375,
        "reward_min": -2.578875,
        "leartime_s": 0.0065796609851531684,
        "sampletime": 2.0557822750124615,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 214000,
        "reward_mean": -1.134525,
        "reward_max": -0.2958125,
        "reward_min": -2.3760000000000012,
        "leartime_s": 0.012362345994915813,
        "sampletime": 1.9725905339873862,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 216000,
        "reward_mean": -1.0472250000000003,
        "reward_max": -0.0318124999999997,
        "reward_min": -2.333000000000001,
        "leartime_s": 0.03612456101109274,
        "sampletime": 1.9714489440084435,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 218000,
        "reward_mean": -1.2268750000000002,
        "reward_max": -0.0011874999999999221,
        "reward_min": -2.301375,
        "leartime_s": 0.031137332000071183,
        "sampletime": 2.0759906790044624,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 220000,
        "reward_mean": -1.2019750000000007,
        "reward_max": -0.27087500000000014,
        "reward_min": -2.509125,
        "leartime_s": 0.0155617110140156,
        "sampletime": 1.8765139350143727,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 222000,
        "reward_mean": -1.0111750000000004,
        "reward_max": -0.14687499999999992,
        "reward_min": -1.9395000000000004,
        "leartime_s": 0.03746582200983539,
        "sampletime": 1.82914891600376,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 224000,
        "reward_mean": -1.3237500000000002,
        "reward_max": -0.07787499999999997,
        "reward_min": -2.6243750000000006,
        "leartime_s": 0.06828368699643761,
        "sampletime": 1.9567324090166949,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 226000,
        "reward_mean": -1.3072250000000003,
        "reward_max": -0.3243125,
        "reward_min": -2.4166250000000002,
        "leartime_s": 0.017646627995418385,
        "sampletime": 1.9803753290034365,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 228000,
        "reward_mean": -0.9339000000000001,
        "reward_max": -0.018624999999999947,
        "reward_min": -2.1557500000000003,
        "leartime_s": 0.0248221029760316,
        "sampletime": 1.9108843629946932,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 230000,
        "reward_mean": -0.8107750000000002,
        "reward_max": 0.17987500000000023,
        "reward_min": -1.833437500000001,
        "leartime_s": 0.009115711000049487,
        "sampletime": 1.6953804760123603,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 232000,
        "reward_mean": -1.0798250000000003,
        "reward_max": -0.10737499999999989,
        "reward_min": -2.4606250000000003,
        "leartime_s": 0.026503945991862565,
        "sampletime": 1.920957346999785,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 234000,
        "reward_mean": -1.1273250000000004,
        "reward_max": -0.02393749999999982,
        "reward_min": -2.3218750000000004,
        "leartime_s": 0.01913014901219867,
        "sampletime": 1.7294009249890223,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 236000,
        "reward_mean": -0.9849750000000003,
        "reward_max": -0.1591249999999998,
        "reward_min": -2.071125000000001,
        "leartime_s": 0.02770474599674344,
        "sampletime": 2.3636577889847104,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 238000,
        "reward_mean": -1.324025,
        "reward_max": -0.3437499999999999,
        "reward_min": -2.6926250000000005,
        "leartime_s": 0.013885327993193641,
        "sampletime": 1.9792179059877526,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 240000,
        "reward_mean": -1.163625,
        "reward_max": -0.10293749999999956,
        "reward_min": -2.5402500000000003,
        "leartime_s": 0.024698302004253492,
        "sampletime": 1.9235791669925675,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 242000,
        "reward_mean": -1.1622250000000003,
        "reward_max": -0.08274999999999991,
        "reward_min": -2.2663749999999996,
        "leartime_s": 0.03296620701439679,
        "sampletime": 1.9193327700195368,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 244000,
        "reward_mean": -1.1860000000000004,
        "reward_max": -0.29624999999999996,
        "reward_min": -2.5878750000000004,
        "leartime_s": 0.009606443985830992,
        "sampletime": 1.9169995859847404,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 246000,
        "reward_mean": -0.9835500000000001,
        "reward_max": -0.1211250000000002,
        "reward_min": -2.2761250000000004,
        "leartime_s": 0.02972929200041108,
        "sampletime": 2.130153286008863,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 248000,
        "reward_mean": -1.1075750000000004,
        "reward_max": -0.27200000000000024,
        "reward_min": -2.1855625000000005,
        "leartime_s": 0.035728698974708095,
        "sampletime": 1.9836444199900143,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 250000,
        "reward_mean": -0.8448000000000002,
        "reward_max": 0.30168750000000033,
        "reward_min": -2.3795625000000005,
        "leartime_s": 0.02579697102191858,
        "sampletime": 1.9433851669891737,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 252000,
        "reward_mean": -1.1623750000000002,
        "reward_max": -0.11999999999999972,
        "reward_min": -2.7031875000000003,
        "leartime_s": 0.029979548999108374,
        "sampletime": 1.9487856890191324,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 254000,
        "reward_mean": -1.1761750000000002,
        "reward_max": -0.19343749999999998,
        "reward_min": -2.2993750000000013,
        "leartime_s": 0.010607292002532631,
        "sampletime": 1.8075955600070301,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 256000,
        "reward_mean": -1.1507250000000004,
        "reward_max": -0.2546250000000002,
        "reward_min": -2.4329375000000013,
        "leartime_s": 0.009279502992285416,
        "sampletime": 1.828597843006719,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 258000,
        "reward_mean": -1.3407250000000004,
        "reward_max": -0.4038124999999999,
        "reward_min": -2.4785000000000013,
        "leartime_s": 0.01821780198952183,
        "sampletime": 2.043954094988294,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 260000,
        "reward_mean": -1.3137500000000004,
        "reward_max": -0.03718749999999997,
        "reward_min": -2.4358125,
        "leartime_s": 0.014907567005138844,
        "sampletime": 1.6537110919889528,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 262000,
        "reward_mean": -1.1550500000000001,
        "reward_max": -0.10187500000000008,
        "reward_min": -2.2435,
        "leartime_s": 0.01724219400784932,
        "sampletime": 1.7281930320023093,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 264000,
        "reward_mean": -1.4133250000000002,
        "reward_max": -0.6334375000000002,
        "reward_min": -2.417875000000001,
        "leartime_s": 0.010235708992695436,
        "sampletime": 1.8886056809860747,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 266000,
        "reward_mean": -0.8963000000000002,
        "reward_max": 0.028249999999999987,
        "reward_min": -2.399375,
        "leartime_s": 0.028799219988286495,
        "sampletime": 1.9157444070151541,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 268000,
        "reward_mean": -1.2015750000000003,
        "reward_max": -0.13612499999999997,
        "reward_min": -2.6918750000000014,
        "leartime_s": 0.06576446202234365,
        "sampletime": 2.0709475509938784,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 270000,
        "reward_mean": -1.3805250000000002,
        "reward_max": -0.5116875,
        "reward_min": -2.6111875,
        "leartime_s": 0.011683891003485769,
        "sampletime": 2.1578003280155826,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 272000,
        "reward_mean": -1.2232250000000002,
        "reward_max": -0.1916249999999999,
        "reward_min": -2.7424375,
        "leartime_s": 0.049855518009280786,
        "sampletime": 1.9650155859999359,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 274000,
        "reward_mean": -1.142875,
        "reward_max": -0.2558749999999998,
        "reward_min": -2.3192500000000007,
        "leartime_s": 0.01097353600198403,
        "sampletime": 2.174524712987477,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 276000,
        "reward_mean": -1.3154750000000004,
        "reward_max": -0.4840625,
        "reward_min": -2.4962500000000003,
        "leartime_s": 0.010425860993564129,
        "sampletime": 1.8648448410094716,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 278000,
        "reward_mean": -1.2429750000000004,
        "reward_max": -0.27756250000000027,
        "reward_min": -2.616562500000001,
        "leartime_s": 0.026360185001976788,
        "sampletime": 1.8602378710056655,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 280000,
        "reward_mean": -1.1162213833333334,
        "reward_max": -0.2680625000000001,
        "reward_min": -2.222937500000001,
        "leartime_s": 0.0502786319993902,
        "sampletime": 2.2219199519895483,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 282000,
        "reward_mean": -1.0253750000000001,
        "reward_max": 0.04806250000000003,
        "reward_min": -2.1958125,
        "leartime_s": 0.02062083999044262,
        "sampletime": 1.854386295977747,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 284000,
        "reward_mean": -1.3113250000000003,
        "reward_max": -0.3400000000000002,
        "reward_min": -2.5158750000000003,
        "leartime_s": 0.018661365000298247,
        "sampletime": 2.064204513997538,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 286000,
        "reward_mean": -1.4078000000000002,
        "reward_max": -0.20637499999999975,
        "reward_min": -2.7969375000000003,
        "leartime_s": 0.04540926398476586,
        "sampletime": 2.2558350609906483,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 288000,
        "reward_mean": -1.3221000000000003,
        "reward_max": -0.5019375000000001,
        "reward_min": -2.6793750000000003,
        "leartime_s": 0.012200605007819831,
        "sampletime": 1.6829049109946936,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 290000,
        "reward_mean": -1.1592750000000005,
        "reward_max": -0.24700000000000005,
        "reward_min": -2.784812500000001,
        "leartime_s": 0.010963714972604066,
        "sampletime": 1.9959780939971097,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 292000,
        "reward_mean": -1.3169000000000004,
        "reward_max": -0.2110624999999997,
        "reward_min": -2.85375,
        "leartime_s": 0.01410383899929002,
        "sampletime": 2.3261119480011985,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 294000,
        "reward_mean": -1.2972000000000004,
        "reward_max": -0.31931249999999994,
        "reward_min": -2.6131875000000004,
        "leartime_s": 0.017222751019289717,
        "sampletime": 1.7778961099975277,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 296000,
        "reward_mean": -1.354125,
        "reward_max": -0.3185625,
        "reward_min": -2.4748750000000013,
        "leartime_s": 0.011245497007621452,
        "sampletime": 1.7532689979998395,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 298000,
        "reward_mean": -1.2596250000000002,
        "reward_max": -0.11143749999999991,
        "reward_min": -2.4310625000000012,
        "leartime_s": 0.021827050019055605,
        "sampletime": 2.0530391029897146,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 300000,
        "reward_mean": -0.7974000000000001,
        "reward_max": 0.1462500000000002,
        "reward_min": -1.9002500000000007,
        "leartime_s": 0.028333941008895636,
        "sampletime": 1.974027822026983,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 302000,
        "reward_mean": -0.9797750000000002,
        "reward_max": -0.12112500000000001,
        "reward_min": -2.01725,
        "leartime_s": 0.026526097004534677,
        "sampletime": 1.774731031007832,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 304000,
        "reward_mean": -1.3065250000000002,
        "reward_max": -0.3101875,
        "reward_min": -2.6894375,
        "leartime_s": 0.11106061298050918,
        "sampletime": 2.073372498009121,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 306000,
        "reward_mean": -1.1766,
        "reward_max": -0.12268749999999998,
        "reward_min": -2.391562500000001,
        "leartime_s": 0.010535101988352835,
        "sampletime": 2.207944255002076,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 308000,
        "reward_mean": -1.2425750000000002,
        "reward_max": -0.1373124999999999,
        "reward_min": -2.5198124999999996,
        "leartime_s": 0.019092917995294556,
        "sampletime": 1.9221348939754535,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 310000,
        "reward_mean": -1.1175,
        "reward_max": -0.27393749999999994,
        "reward_min": -2.4174375000000006,
        "leartime_s": 0.012754938972648233,
        "sampletime": 2.305320077983197,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 312000,
        "reward_mean": -1.2858750000000003,
        "reward_max": -0.2603125000000001,
        "reward_min": -2.8358125000000007,
        "leartime_s": 0.011629880988039076,
        "sampletime": 2.2008467690029647,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 314000,
        "reward_mean": -1.3349000000000002,
        "reward_max": -0.0004999999999998547,
        "reward_min": -2.8279375000000004,
        "leartime_s": 0.032718255009967834,
        "sampletime": 1.8197005359979812,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 316000,
        "reward_mean": -1.0638500000000002,
        "reward_max": -0.13399999999999962,
        "reward_min": -2.3596875000000006,
        "leartime_s": 0.01184409300913103,
        "sampletime": 2.27842125800089,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 318000,
        "reward_mean": -1.0964,
        "reward_max": -0.07968749999999986,
        "reward_min": -2.1786250000000003,
        "leartime_s": 0.024639481998747215,
        "sampletime": 1.9072934739815537,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 320000,
        "reward_mean": -0.9872250000000001,
        "reward_max": -0.11137499999999997,
        "reward_min": -2.285062500000001,
        "leartime_s": 0.07532676600385457,
        "sampletime": 2.4801462800242007,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 322000,
        "reward_mean": -1.2063750000000002,
        "reward_max": -0.10512500000000005,
        "reward_min": -2.3793125000000015,
        "leartime_s": 0.05362832799437456,
        "sampletime": 1.6990195710095577,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 324000,
        "reward_mean": -1.3616000000000001,
        "reward_max": -0.21149999999999985,
        "reward_min": -2.9430624999999995,
        "leartime_s": 0.02432571997633204,
        "sampletime": 2.0311050830059685,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 326000,
        "reward_mean": -1.3505500000000001,
        "reward_max": -0.4133125000000001,
        "reward_min": -2.7961875000000003,
        "leartime_s": 0.0315756659838371,
        "sampletime": 1.9108178020105697,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 328000,
        "reward_mean": -1.3227250000000002,
        "reward_max": -0.32031249999999994,
        "reward_min": -2.8476250000000007,
        "leartime_s": 0.012868649995652959,
        "sampletime": 1.7797805559821427,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 330000,
        "reward_mean": -1.4561750000000002,
        "reward_max": -0.5224374999999999,
        "reward_min": -2.5510000000000006,
        "leartime_s": 0.01089209399651736,
        "sampletime": 1.718530493992148,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 332000,
        "reward_mean": -1.13165,
        "reward_max": -0.24468750000000006,
        "reward_min": -2.9675625000000005,
        "leartime_s": 0.01986033999128267,
        "sampletime": 1.9848956280038692,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 334000,
        "reward_mean": -0.8964500000000003,
        "reward_max": 0.04793750000000007,
        "reward_min": -2.066312500000001,
        "leartime_s": 0.011758831999031827,
        "sampletime": 2.217594219982857,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 336000,
        "reward_mean": -1.1629750000000003,
        "reward_max": -0.018124999999999905,
        "reward_min": -2.5048125000000003,
        "leartime_s": 0.014144719985779375,
        "sampletime": 1.8250693040026817,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 338000,
        "reward_mean": -1.2121000000000004,
        "reward_max": -0.33175,
        "reward_min": -2.3601875000000003,
        "leartime_s": 0.03405677599948831,
        "sampletime": 2.0918013410118874,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 340000,
        "reward_mean": -1.1392000000000002,
        "reward_max": -0.06531249999999988,
        "reward_min": -2.376562500000001,
        "leartime_s": 0.009493294026469812,
        "sampletime": 2.1003578789823223,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 342000,
        "reward_mean": -1.1482500000000002,
        "reward_max": 0.16425000000000023,
        "reward_min": -2.3841250000000005,
        "leartime_s": 0.013561895000748336,
        "sampletime": 1.8470085440203547,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 344000,
        "reward_mean": -1.3816250000000003,
        "reward_max": -0.3890625,
        "reward_min": -2.5621875,
        "leartime_s": 0.008974149997811764,
        "sampletime": 2.116677454992896,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 346000,
        "reward_mean": -1.3258750000000001,
        "reward_max": -0.12356249999999991,
        "reward_min": -2.8156875000000006,
        "leartime_s": 0.051407590974122286,
        "sampletime": 2.11046724600601,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 348000,
        "reward_mean": -1.2817250000000004,
        "reward_max": -0.37906250000000014,
        "reward_min": -2.9951250000000007,
        "leartime_s": 0.02042546699522063,
        "sampletime": 1.6742249919916503,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 350000,
        "reward_mean": -0.8539500000000001,
        "reward_max": 0.06893750000000023,
        "reward_min": -1.9482500000000007,
        "leartime_s": 0.01508661700063385,
        "sampletime": 1.9885408910049591,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 352000,
        "reward_mean": -1.1982250000000003,
        "reward_max": -0.030687499999999722,
        "reward_min": -2.841312500000001,
        "leartime_s": 0.030221941997297108,
        "sampletime": 2.0063280610193033,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 354000,
        "reward_mean": -1.016575,
        "reward_max": -0.0765624999999999,
        "reward_min": -2.3256875000000004,
        "leartime_s": 0.027169367007445544,
        "sampletime": 1.7194849520165008,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 356000,
        "reward_mean": -1.2897250000000005,
        "reward_max": -0.10918749999999985,
        "reward_min": -2.5810000000000004,
        "leartime_s": 0.024380340008065104,
        "sampletime": 2.5841148960171267,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 358000,
        "reward_mean": -1.0410500000000003,
        "reward_max": -0.07193749999999971,
        "reward_min": -2.342062500000001,
        "leartime_s": 0.01980213398928754,
        "sampletime": 1.8700225100037642,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 360000,
        "reward_mean": -1.1677500000000005,
        "reward_max": -0.20349999999999996,
        "reward_min": -2.4538750000000005,
        "leartime_s": 0.01245482699596323,
        "sampletime": 2.071878552000271,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 362000,
        "reward_mean": -1.262925,
        "reward_max": -0.484125,
        "reward_min": -2.235625,
        "leartime_s": 0.011777211009757593,
        "sampletime": 1.6990975539956708,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 364000,
        "reward_mean": -1.1094750000000002,
        "reward_max": 0.02293750000000028,
        "reward_min": -2.180812500000001,
        "leartime_s": 0.03610160099924542,
        "sampletime": 1.7981411700020544,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 366000,
        "reward_mean": -1.3355250000000003,
        "reward_max": -0.3808749999999999,
        "reward_min": -2.6647500000000006,
        "leartime_s": 0.042073213000549003,
        "sampletime": 1.8745550849998835,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 368000,
        "reward_mean": -1.24685,
        "reward_max": -0.373,
        "reward_min": -2.2301250000000006,
        "leartime_s": 0.040254869003547356,
        "sampletime": 1.8797764150076546,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 370000,
        "reward_mean": -0.9844500000000003,
        "reward_max": 0.16862500000000014,
        "reward_min": -2.3016875000000008,
        "leartime_s": 0.034246672003064305,
        "sampletime": 2.0652898109983653,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 372000,
        "reward_mean": -1.0386750000000002,
        "reward_max": 0.0386250000000001,
        "reward_min": -2.306687500000001,
        "leartime_s": 0.0389335929939989,
        "sampletime": 1.8322873209835961,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 374000,
        "reward_mean": -1.1800500000000003,
        "reward_max": -0.22893749999999988,
        "reward_min": -2.3770000000000002,
        "leartime_s": 0.04454759700456634,
        "sampletime": 1.8615868389897514,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 376000,
        "reward_mean": -1.0830250000000001,
        "reward_max": -0.18100000000000016,
        "reward_min": -2.4321250000000005,
        "leartime_s": 0.01783674900070764,
        "sampletime": 1.9774988279968966,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 378000,
        "reward_mean": -1.0695500000000002,
        "reward_max": -0.03106250000000002,
        "reward_min": -2.5361875000000014,
        "leartime_s": 0.058628146012779325,
        "sampletime": 2.107012580992887,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 380000,
        "reward_mean": -1.2054500000000001,
        "reward_max": -0.3010625,
        "reward_min": -2.439812500000001,
        "leartime_s": 0.04168424001545645,
        "sampletime": 1.7101465049781837,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 382000,
        "reward_mean": -1.2144750000000002,
        "reward_max": -0.20924999999999985,
        "reward_min": -2.2144375000000003,
        "leartime_s": 0.026701157999923453,
        "sampletime": 2.2207422819919884,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 384000,
        "reward_mean": -1.4414250000000002,
        "reward_max": -0.5401249999999999,
        "reward_min": -3.1080625,
        "leartime_s": 0.03865959099493921,
        "sampletime": 1.8758851460006554,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 386000,
        "reward_mean": -0.9492250000000002,
        "reward_max": 0.08706250000000024,
        "reward_min": -2.6536250000000003,
        "leartime_s": 0.032483132992638275,
        "sampletime": 1.9037893239874393,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 388000,
        "reward_mean": -0.9627250000000002,
        "reward_max": -0.03281249999999976,
        "reward_min": -2.700375,
        "leartime_s": 0.02701908999006264,
        "sampletime": 2.099643360998016,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 390000,
        "reward_mean": -1.0859750000000001,
        "reward_max": -0.09349999999999992,
        "reward_min": -2.4448125000000007,
        "leartime_s": 0.025314055004855618,
        "sampletime": 1.8720760700234678,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 392000,
        "reward_mean": -1.1635000000000002,
        "reward_max": -0.3026250000000001,
        "reward_min": -2.3424375,
        "leartime_s": 0.06186516900197603,
        "sampletime": 1.8884962340234779,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 394000,
        "reward_mean": -1.1100250000000003,
        "reward_max": -0.0013124999999998138,
        "reward_min": -3.1081875000000014,
        "leartime_s": 0.03685450702323578,
        "sampletime": 1.6712295380129945,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 396000,
        "reward_mean": -1.0845000000000002,
        "reward_max": -0.09568749999999995,
        "reward_min": -2.1566250000000005,
        "leartime_s": 0.031690366013208404,
        "sampletime": 2.0700639889982995,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 398000,
        "reward_mean": -1.0182750000000003,
        "reward_max": -0.16949999999999998,
        "reward_min": -2.2295625,
        "leartime_s": 0.03880046200356446,
        "sampletime": 1.6964794640080072,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 400000,
        "reward_mean": -1.1732250000000004,
        "reward_max": -0.08506249999999968,
        "reward_min": -2.4033750000000005,
        "leartime_s": 0.016157095989910886,
        "sampletime": 2.1264283979835454,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 402000,
        "reward_mean": -1.0198250000000002,
        "reward_max": -0.018874999999999857,
        "reward_min": -2.0865000000000005,
        "leartime_s": 0.016504578990861773,
        "sampletime": 2.0025198129878845,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 404000,
        "reward_mean": -0.9579500000000003,
        "reward_max": -0.026562500000000037,
        "reward_min": -2.078187500000001,
        "leartime_s": 0.029359508014749736,
        "sampletime": 1.8849377270089462,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 406000,
        "reward_mean": -1.2126750000000002,
        "reward_max": -0.06668749999999962,
        "reward_min": -3.0415625000000004,
        "leartime_s": 0.013353771006222814,
        "sampletime": 1.997289135993924,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 408000,
        "reward_mean": -0.7995000000000002,
        "reward_max": 0.14306250000000034,
        "reward_min": -1.916625000000001,
        "leartime_s": 0.035472346004098654,
        "sampletime": 1.8884954100067262,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 410000,
        "reward_mean": -1.0793750000000002,
        "reward_max": -0.16168749999999982,
        "reward_min": -2.3153125000000006,
        "leartime_s": 0.04523997800424695,
        "sampletime": 1.8876117169857025,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 412000,
        "reward_mean": -1.2052000000000003,
        "reward_max": -0.13837499999999986,
        "reward_min": -2.678375000000001,
        "leartime_s": 0.04662845900747925,
        "sampletime": 2.171723145991564,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 414000,
        "reward_mean": -0.9068500000000002,
        "reward_max": -0.03374999999999999,
        "reward_min": -2.3843125000000005,
        "leartime_s": 0.02408369700424373,
        "sampletime": 1.9847667849971913,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 416000,
        "reward_mean": -0.9752500000000001,
        "reward_max": -0.17762499999999992,
        "reward_min": -2.0838125000000005,
        "leartime_s": 0.012626587995328009,
        "sampletime": 1.7592743290006183,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 418000,
        "reward_mean": -1.1503250000000003,
        "reward_max": -0.06587499999999986,
        "reward_min": -2.2484375000000005,
        "leartime_s": 0.08392069899127819,
        "sampletime": 1.7999771010072436,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 420000,
        "reward_mean": -1.0419500000000002,
        "reward_max": -0.16737500000000016,
        "reward_min": -2.0306875000000004,
        "leartime_s": 0.01993190500070341,
        "sampletime": 2.1539298680145293,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 422000,
        "reward_mean": -0.8832000000000001,
        "reward_max": -0.034937500000000093,
        "reward_min": -2.1436250000000006,
        "leartime_s": 0.03215147499577142,
        "sampletime": 1.873283432010794,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 424000,
        "reward_mean": -0.8468750000000002,
        "reward_max": 0.12700000000000028,
        "reward_min": -1.9801875000000002,
        "leartime_s": 0.027803956996649504,
        "sampletime": 1.9928393530135509,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 426000,
        "reward_mean": -0.8869000000000001,
        "reward_max": 0.12162500000000007,
        "reward_min": -1.9886875000000004,
        "leartime_s": 0.02956947000348009,
        "sampletime": 1.6215313310094643,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 428000,
        "reward_mean": -1.0538750000000001,
        "reward_max": -0.08562499999999998,
        "reward_min": -2.565750000000001,
        "leartime_s": 0.058241149003151804,
        "sampletime": 1.8963433709868696,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 430000,
        "reward_mean": -0.9378750000000001,
        "reward_max": 0.08843750000000024,
        "reward_min": -1.9266250000000005,
        "leartime_s": 0.10022474598372355,
        "sampletime": 1.9224870699981693,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 432000,
        "reward_mean": -0.9230250000000001,
        "reward_max": -0.06937499999999981,
        "reward_min": -2.1530625000000003,
        "leartime_s": 0.019270095974206924,
        "sampletime": 1.994254079007078,
        "best_mean": -0.7863250000000002,
        "best_max": 0.21018750000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 434000,
        "reward_mean": -0.740075,
        "reward_max": 0.15306250000000038,
        "reward_min": -1.6172500000000003,
        "leartime_s": 0.06865195001591928,
        "sampletime": 1.6983548840216827,
        "best_mean": -0.740075,
        "best_max": 0.15306250000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 436000,
        "reward_mean": -0.8960250000000001,
        "reward_max": 0.05193750000000014,
        "reward_min": -2.3155625000000004,
        "leartime_s": 0.040222859010100365,
        "sampletime": 2.132889348984463,
        "best_mean": -0.740075,
        "best_max": 0.15306250000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 438000,
        "reward_mean": -0.7824750000000001,
        "reward_max": 0.31462500000000015,
        "reward_min": -1.8881875000000008,
        "leartime_s": 0.022822907980298623,
        "sampletime": 1.9402654340083245,
        "best_mean": -0.740075,
        "best_max": 0.15306250000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 440000,
        "reward_mean": -0.95265,
        "reward_max": -0.04612499999999971,
        "reward_min": -2.3183750000000005,
        "leartime_s": 0.014588563004508615,
        "sampletime": 1.6619270709925331,
        "best_mean": -0.740075,
        "best_max": 0.15306250000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 442000,
        "reward_mean": -1.2524000000000002,
        "reward_max": -0.12456249999999981,
        "reward_min": -2.3598125000000008,
        "leartime_s": 0.02823225999600254,
        "sampletime": 2.0113223530061077,
        "best_mean": -0.740075,
        "best_max": 0.15306250000000038,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 444000,
        "reward_mean": -0.726875,
        "reward_max": 0.14337500000000014,
        "reward_min": -2.2431875000000003,
        "leartime_s": 0.013793297024676576,
        "sampletime": 2.079704906005645,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 446000,
        "reward_mean": -0.7827250000000001,
        "reward_max": 0.22756250000000028,
        "reward_min": -2.2904375000000003,
        "leartime_s": 0.03682763600954786,
        "sampletime": 1.6380086129938718,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 448000,
        "reward_mean": -0.9580000000000002,
        "reward_max": 0.06650000000000002,
        "reward_min": -1.9524375000000003,
        "leartime_s": 0.014243498007999733,
        "sampletime": 2.1451475110079627,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 450000,
        "reward_mean": -0.8775000000000002,
        "reward_max": 0.15731250000000024,
        "reward_min": -1.9029375000000008,
        "leartime_s": 0.04577007601619698,
        "sampletime": 2.093936521996511,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 452000,
        "reward_mean": -1.006175,
        "reward_max": 0.060062500000000144,
        "reward_min": -2.3001250000000004,
        "leartime_s": 0.04748015900258906,
        "sampletime": 1.656141610990744,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 454000,
        "reward_mean": -0.7666000000000002,
        "reward_max": 0.3329375000000005,
        "reward_min": -2.3099375000000006,
        "leartime_s": 0.014139071019599214,
        "sampletime": 2.0067067769996356,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 456000,
        "reward_mean": -0.8444,
        "reward_max": 0.02418750000000036,
        "reward_min": -1.8476250000000007,
        "leartime_s": 0.05571453302400187,
        "sampletime": 2.03846514999168,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 458000,
        "reward_mean": -0.9399750000000001,
        "reward_max": 0.14450000000000018,
        "reward_min": -2.3075625000000004,
        "leartime_s": 0.03609387099277228,
        "sampletime": 1.8055639299855102,
        "best_mean": -0.726875,
        "best_max": 0.14337500000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 460000,
        "reward_mean": -0.5414249999999999,
        "reward_max": 0.5481250000000001,
        "reward_min": -1.8756250000000003,
        "leartime_s": 0.008724938001250848,
        "sampletime": 1.6681407550058793,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 462000,
        "reward_mean": -0.798625,
        "reward_max": 0.3161250000000001,
        "reward_min": -2.060125,
        "leartime_s": 0.009316101990407333,
        "sampletime": 1.9614167750114575,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 464000,
        "reward_mean": -0.8385250000000002,
        "reward_max": 0.06643750000000018,
        "reward_min": -2.3039375000000004,
        "leartime_s": 0.04546104100882076,
        "sampletime": 1.9143245809827931,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 466000,
        "reward_mean": -0.5654250000000001,
        "reward_max": 0.3649375000000003,
        "reward_min": -1.7552500000000002,
        "leartime_s": 0.061294052022276446,
        "sampletime": 1.7818250360141974,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 468000,
        "reward_mean": -0.946575,
        "reward_max": -0.11706250000000014,
        "reward_min": -2.1335000000000006,
        "leartime_s": 0.02025767700979486,
        "sampletime": 1.9213839730073232,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 470000,
        "reward_mean": -0.8311750000000002,
        "reward_max": 0.30675000000000024,
        "reward_min": -2.0877500000000007,
        "leartime_s": 0.014454323012614623,
        "sampletime": 2.040107362001436,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 472000,
        "reward_mean": -0.6705500000000001,
        "reward_max": 0.3495625000000004,
        "reward_min": -1.7864375000000008,
        "leartime_s": 0.04196151701034978,
        "sampletime": 1.7806752120086458,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 474000,
        "reward_mean": -0.9943250000000002,
        "reward_max": -0.005999999999999749,
        "reward_min": -2.2962500000000006,
        "leartime_s": 0.01484341500326991,
        "sampletime": 2.286602489009965,
        "best_mean": -0.5414249999999999,
        "best_max": 0.5481250000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 476000,
        "reward_mean": -0.5028750000000001,
        "reward_max": 0.5171250000000003,
        "reward_min": -1.6875000000000004,
        "leartime_s": 0.028684812976280227,
        "sampletime": 1.6740842170256656,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 478000,
        "reward_mean": -0.709075,
        "reward_max": 0.17887500000000045,
        "reward_min": -2.0565625000000005,
        "leartime_s": 0.03772660298272967,
        "sampletime": 2.2099823460157495,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 480000,
        "reward_mean": -0.8972250000000002,
        "reward_max": -0.011187499999999947,
        "reward_min": -2.1982500000000007,
        "leartime_s": 0.022709896991727874,
        "sampletime": 2.285042885981966,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 482000,
        "reward_mean": -0.603075,
        "reward_max": 0.33768750000000036,
        "reward_min": -1.6676250000000008,
        "leartime_s": 0.03975815500598401,
        "sampletime": 1.83152601798065,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 484000,
        "reward_mean": -0.7306750000000002,
        "reward_max": 0.07287500000000012,
        "reward_min": -2.2516875000000005,
        "leartime_s": 0.023668234003707767,
        "sampletime": 2.1482754060125444,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 486000,
        "reward_mean": -0.8453,
        "reward_max": 0.23206250000000023,
        "reward_min": -2.0105625,
        "leartime_s": 0.02936674901866354,
        "sampletime": 1.9185645660036243,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 488000,
        "reward_mean": -0.6966750000000002,
        "reward_max": 0.09675000000000022,
        "reward_min": -1.5670625000000005,
        "leartime_s": 0.041796466015512124,
        "sampletime": 1.6418629350082483,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 490000,
        "reward_mean": -0.54545,
        "reward_max": 0.35706250000000034,
        "reward_min": -2.0685000000000002,
        "leartime_s": 0.024372420011786744,
        "sampletime": 1.9647290659777354,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 492000,
        "reward_mean": -0.6795000000000002,
        "reward_max": 0.32043750000000015,
        "reward_min": -1.7421875000000009,
        "leartime_s": 0.013983898010337725,
        "sampletime": 1.6107295340043493,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 494000,
        "reward_mean": -0.582375,
        "reward_max": 0.38112500000000027,
        "reward_min": -1.637625000000001,
        "leartime_s": 0.0166831300011836,
        "sampletime": 1.7180704349884763,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 496000,
        "reward_mean": -0.8319500000000001,
        "reward_max": 0.16268750000000035,
        "reward_min": -1.8765000000000007,
        "leartime_s": 0.021665257983841002,
        "sampletime": 1.5993220749951433,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 498000,
        "reward_mean": -0.77425,
        "reward_max": 0.2817500000000004,
        "reward_min": -1.9920000000000004,
        "leartime_s": 0.015810303011676297,
        "sampletime": 1.6673832540109288,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 500000,
        "reward_mean": -0.7152250000000001,
        "reward_max": 0.16450000000000015,
        "reward_min": -2.235125,
        "leartime_s": 0.03947455299203284,
        "sampletime": 1.566998518013861,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 502000,
        "reward_mean": -0.6970500000000001,
        "reward_max": 0.15718750000000029,
        "reward_min": -2.0115000000000003,
        "leartime_s": 0.028962765005417168,
        "sampletime": 1.5222239189897664,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 504000,
        "reward_mean": -0.7608500000000001,
        "reward_max": 0.36550000000000027,
        "reward_min": -1.9754375000000004,
        "leartime_s": 0.052924897987395525,
        "sampletime": 1.6370703479915392,
        "best_mean": -0.5028750000000001,
        "best_max": 0.5171250000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 506000,
        "reward_mean": -0.47867499999999996,
        "reward_max": 0.38406250000000025,
        "reward_min": -1.5419999999999998,
        "leartime_s": 0.025652160024037585,
        "sampletime": 1.6465524320083205,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 508000,
        "reward_mean": -0.89805,
        "reward_max": -0.07537499999999982,
        "reward_min": -2.1403750000000006,
        "leartime_s": 0.018661531008547172,
        "sampletime": 1.6081261129875202,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 510000,
        "reward_mean": -0.58935,
        "reward_max": 0.26956250000000015,
        "reward_min": -2.185062500000001,
        "leartime_s": 0.02012695698067546,
        "sampletime": 1.5608122590056155,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 512000,
        "reward_mean": -0.76985,
        "reward_max": 0.11131250000000031,
        "reward_min": -1.7469375000000005,
        "leartime_s": 0.0198208509827964,
        "sampletime": 1.5729938930016942,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 514000,
        "reward_mean": -0.6866000000000001,
        "reward_max": 0.3231875000000001,
        "reward_min": -1.6932500000000008,
        "leartime_s": 0.027788122999481857,
        "sampletime": 1.5910115190199576,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 516000,
        "reward_mean": -0.6091749999999999,
        "reward_max": 0.35406250000000034,
        "reward_min": -1.7234375000000004,
        "leartime_s": 0.017642787017393857,
        "sampletime": 1.5933838389755692,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 518000,
        "reward_mean": -0.701825,
        "reward_max": 0.36737500000000034,
        "reward_min": -1.8785000000000007,
        "leartime_s": 0.014368881995324045,
        "sampletime": 1.615258317993721,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 520000,
        "reward_mean": -0.7770750000000001,
        "reward_max": 0.2390625000000002,
        "reward_min": -1.6520625,
        "leartime_s": 0.030673524976009503,
        "sampletime": 1.571563731005881,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 522000,
        "reward_mean": -0.6578999999999999,
        "reward_max": 0.39425000000000027,
        "reward_min": -1.780875,
        "leartime_s": 0.014662011002656072,
        "sampletime": 1.640308953996282,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 524000,
        "reward_mean": -0.9482250000000001,
        "reward_max": 0.4678750000000004,
        "reward_min": -2.1182500000000006,
        "leartime_s": 0.031008787016617134,
        "sampletime": 1.6247389630007092,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 526000,
        "reward_mean": -0.660575,
        "reward_max": 0.34475000000000033,
        "reward_min": -1.7272500000000002,
        "leartime_s": 0.036768060992471874,
        "sampletime": 1.5998707989929244,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 528000,
        "reward_mean": -0.67275,
        "reward_max": 0.37081250000000043,
        "reward_min": -1.7724374999999997,
        "leartime_s": 0.015552880999166518,
        "sampletime": 1.6274562399776187,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 530000,
        "reward_mean": -0.5228749999999999,
        "reward_max": 0.5563125000000004,
        "reward_min": -1.7545000000000004,
        "leartime_s": 0.01553808999597095,
        "sampletime": 1.571514268987812,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 532000,
        "reward_mean": -0.593925,
        "reward_max": 0.3261875000000004,
        "reward_min": -2.1739375000000005,
        "leartime_s": 0.03461411502212286,
        "sampletime": 1.600428492994979,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 534000,
        "reward_mean": -0.56095,
        "reward_max": 0.34962500000000035,
        "reward_min": -1.8648125000000007,
        "leartime_s": 0.020529456989606842,
        "sampletime": 1.7192168820183724,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 536000,
        "reward_mean": -0.6927249999999999,
        "reward_max": 0.21556250000000016,
        "reward_min": -1.7419375000000004,
        "leartime_s": 0.061258062021806836,
        "sampletime": 1.5041184139845427,
        "best_mean": -0.47867499999999996,
        "best_max": 0.38406250000000025,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 538000,
        "reward_mean": -0.44937499999999997,
        "reward_max": 0.3565625000000001,
        "reward_min": -1.5000625000000003,
        "leartime_s": 0.025322846980998293,
        "sampletime": 1.6531275390007067,
        "best_mean": -0.44937499999999997,
        "best_max": 0.3565625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 540000,
        "reward_mean": -0.492425,
        "reward_max": 0.4825625000000003,
        "reward_min": -1.6143750000000003,
        "leartime_s": 0.03613288700580597,
        "sampletime": 1.567831799009582,
        "best_mean": -0.44937499999999997,
        "best_max": 0.3565625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 542000,
        "reward_mean": -0.6584500000000001,
        "reward_max": 0.3908750000000002,
        "reward_min": -1.84625,
        "leartime_s": 0.027958627993939444,
        "sampletime": 1.6755677290202584,
        "best_mean": -0.44937499999999997,
        "best_max": 0.3565625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 544000,
        "reward_mean": -0.5682249999999999,
        "reward_max": 0.3060625000000005,
        "reward_min": -1.5315625000000006,
        "leartime_s": 0.05219375298474915,
        "sampletime": 1.558899129013298,
        "best_mean": -0.44937499999999997,
        "best_max": 0.3565625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 546000,
        "reward_mean": -0.6742749999999998,
        "reward_max": 0.31712500000000043,
        "reward_min": -1.8056875,
        "leartime_s": 0.0155999019916635,
        "sampletime": 1.712106702994788,
        "best_mean": -0.44937499999999997,
        "best_max": 0.3565625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 548000,
        "reward_mean": -0.4019749999999999,
        "reward_max": 0.4587500000000002,
        "reward_min": -1.4140625000000004,
        "leartime_s": 0.06189099801122211,
        "sampletime": 1.664267671003472,
        "best_mean": -0.4019749999999999,
        "best_max": 0.4587500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 550000,
        "reward_mean": -0.5348499999999999,
        "reward_max": 0.41356250000000033,
        "reward_min": -1.9740625000000003,
        "leartime_s": 0.014529723004670814,
        "sampletime": 1.908844757010229,
        "best_mean": -0.4019749999999999,
        "best_max": 0.4587500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 552000,
        "reward_mean": -0.5416499999999999,
        "reward_max": 0.29343750000000035,
        "reward_min": -1.5453750000000004,
        "leartime_s": 0.027846212004078552,
        "sampletime": 2.1013231839751825,
        "best_mean": -0.4019749999999999,
        "best_max": 0.4587500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 554000,
        "reward_mean": -0.6775999999999999,
        "reward_max": 0.4717500000000004,
        "reward_min": -1.9134375,
        "leartime_s": 0.034304305008845404,
        "sampletime": 1.7320450590050314,
        "best_mean": -0.4019749999999999,
        "best_max": 0.4587500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 556000,
        "reward_mean": -0.5099,
        "reward_max": 0.6490625000000002,
        "reward_min": -1.7293750000000003,
        "leartime_s": 0.06191281697829254,
        "sampletime": 1.9574918409925885,
        "best_mean": -0.4019749999999999,
        "best_max": 0.4587500000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 558000,
        "reward_mean": -0.3613999999999999,
        "reward_max": 0.5448125000000001,
        "reward_min": -1.6167500000000001,
        "leartime_s": 0.0292313429818023,
        "sampletime": 2.0997539589880034,
        "best_mean": -0.3613999999999999,
        "best_max": 0.5448125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 560000,
        "reward_mean": -0.5067999999999999,
        "reward_max": 0.41881250000000037,
        "reward_min": -1.6025000000000005,
        "leartime_s": 0.03353632098878734,
        "sampletime": 1.85692457301775,
        "best_mean": -0.3613999999999999,
        "best_max": 0.5448125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 562000,
        "reward_mean": -0.4446749999999998,
        "reward_max": 0.45675000000000043,
        "reward_min": -1.9043125000000005,
        "leartime_s": 0.01715956599218771,
        "sampletime": 1.8101731659844518,
        "best_mean": -0.3613999999999999,
        "best_max": 0.5448125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 564000,
        "reward_mean": -0.39389999999999986,
        "reward_max": 0.46193750000000044,
        "reward_min": -2.1857500000000005,
        "leartime_s": 0.01808070600964129,
        "sampletime": 1.97915031798766,
        "best_mean": -0.3613999999999999,
        "best_max": 0.5448125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 566000,
        "reward_mean": -0.1738499999999998,
        "reward_max": 0.7431875000000007,
        "reward_min": -1.3981250000000003,
        "leartime_s": 0.040844573988579214,
        "sampletime": 1.8606521550100297,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 568000,
        "reward_mean": -0.35229999999999984,
        "reward_max": 0.5160625000000005,
        "reward_min": -1.3823125000000003,
        "leartime_s": 0.025152843998512253,
        "sampletime": 1.830295331979869,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 570000,
        "reward_mean": -0.4954749999999998,
        "reward_max": 0.6505000000000005,
        "reward_min": -1.7781875,
        "leartime_s": 0.018988405005075037,
        "sampletime": 1.9057544929964934,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 572000,
        "reward_mean": -0.5912499999999997,
        "reward_max": 0.3782500000000004,
        "reward_min": -1.8627500000000001,
        "leartime_s": 0.03305166200152598,
        "sampletime": 1.8712431429885328,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 574000,
        "reward_mean": -0.22999999999999982,
        "reward_max": 0.5975625000000004,
        "reward_min": -1.2423125,
        "leartime_s": 0.07665592600824311,
        "sampletime": 1.8880825609958265,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 576000,
        "reward_mean": -0.39992499999999986,
        "reward_max": 0.6116250000000004,
        "reward_min": -1.604625,
        "leartime_s": 0.0839862099965103,
        "sampletime": 1.9534480680013075,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 578000,
        "reward_mean": -0.3112249999999998,
        "reward_max": 0.8216250000000006,
        "reward_min": -1.1301875000000003,
        "leartime_s": 0.03196392199606635,
        "sampletime": 2.0190807539911475,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 580000,
        "reward_mean": -0.42634999999999984,
        "reward_max": 0.6231250000000006,
        "reward_min": -1.5096874999999998,
        "leartime_s": 0.06506676599383354,
        "sampletime": 1.7071188169938978,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 582000,
        "reward_mean": -0.4334249999999999,
        "reward_max": 0.4290625000000003,
        "reward_min": -1.7730624999999998,
        "leartime_s": 0.018396865023532882,
        "sampletime": 1.6296364800073206,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 584000,
        "reward_mean": -0.3988999999999998,
        "reward_max": 0.5363125000000004,
        "reward_min": -1.4556250000000004,
        "leartime_s": 0.01934030299889855,
        "sampletime": 2.036711798980832,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 586000,
        "reward_mean": -0.41844999999999993,
        "reward_max": 0.4295625000000003,
        "reward_min": -1.6060625,
        "leartime_s": 0.021527272008825094,
        "sampletime": 1.9492567259876523,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 588000,
        "reward_mean": -0.43277499999999985,
        "reward_max": 0.5734375000000005,
        "reward_min": -1.7248750000000002,
        "leartime_s": 0.03462385598686524,
        "sampletime": 2.222147980995942,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 590000,
        "reward_mean": -0.2829749999999998,
        "reward_max": 0.6295000000000004,
        "reward_min": -1.4489375000000002,
        "leartime_s": 0.03836836799746379,
        "sampletime": 2.097728141990956,
        "best_mean": -0.1738499999999998,
        "best_max": 0.7431875000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 592000,
        "reward_mean": -0.10994999999999981,
        "reward_max": 0.6905000000000006,
        "reward_min": -1.1836250000000001,
        "leartime_s": 0.028871075017377734,
        "sampletime": 1.897168932016939,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 594000,
        "reward_mean": -0.4643499999999998,
        "reward_max": 0.45043750000000055,
        "reward_min": -1.8385625000000003,
        "leartime_s": 0.03947912700823508,
        "sampletime": 1.8975188600015827,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 596000,
        "reward_mean": -0.6344999999999997,
        "reward_max": 0.26612500000000044,
        "reward_min": -1.8295000000000001,
        "leartime_s": 0.01621832000091672,
        "sampletime": 1.9369337190000806,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 598000,
        "reward_mean": -0.5073749999999998,
        "reward_max": 0.4380625000000003,
        "reward_min": -1.7120625,
        "leartime_s": 0.01942611500271596,
        "sampletime": 1.8847536589892115,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 600000,
        "reward_mean": -0.5057249999999999,
        "reward_max": 0.5065000000000004,
        "reward_min": -1.4992500000000002,
        "leartime_s": 0.042602244997397065,
        "sampletime": 1.7897498710080981,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 602000,
        "reward_mean": -0.3833249999999999,
        "reward_max": 0.4237500000000003,
        "reward_min": -1.490875,
        "leartime_s": 0.029261891992064193,
        "sampletime": 2.125370013003703,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 604000,
        "reward_mean": -0.37827499999999986,
        "reward_max": 0.8280625000000005,
        "reward_min": -1.3874375000000003,
        "leartime_s": 0.01987308799289167,
        "sampletime": 1.9688794130051974,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 606000,
        "reward_mean": -0.3181999999999997,
        "reward_max": 0.5563125000000003,
        "reward_min": -1.8711250000000004,
        "leartime_s": 0.04328050999902189,
        "sampletime": 1.874880524002947,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 608000,
        "reward_mean": -0.38537499999999986,
        "reward_max": 0.5422500000000003,
        "reward_min": -1.7947500000000003,
        "leartime_s": 0.03716521698515862,
        "sampletime": 2.187619234988233,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 610000,
        "reward_mean": -0.5227749999999999,
        "reward_max": 0.4201250000000005,
        "reward_min": -1.7030000000000005,
        "leartime_s": 0.061053459998220205,
        "sampletime": 1.7224932360113598,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 612000,
        "reward_mean": -0.4550999999999999,
        "reward_max": 0.5080000000000006,
        "reward_min": -1.4941875000000002,
        "leartime_s": 0.09360817799461074,
        "sampletime": 1.9295329149754252,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 614000,
        "reward_mean": -0.4938749999999999,
        "reward_max": 0.47631250000000047,
        "reward_min": -1.5393124999999996,
        "leartime_s": 0.0593397049815394,
        "sampletime": 1.7877296119986568,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 616000,
        "reward_mean": -0.3320999999999998,
        "reward_max": 0.6513750000000004,
        "reward_min": -1.5260000000000002,
        "leartime_s": 0.04531908800709061,
        "sampletime": 1.9373755700071342,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 618000,
        "reward_mean": -0.3811249999999998,
        "reward_max": 0.6501250000000003,
        "reward_min": -1.5980625000000002,
        "leartime_s": 0.02382613197551109,
        "sampletime": 2.1469621540163644,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 620000,
        "reward_mean": -0.6728249999999999,
        "reward_max": 0.4062500000000005,
        "reward_min": -1.7129375,
        "leartime_s": 0.019850127981044352,
        "sampletime": 1.7896749530045781,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 622000,
        "reward_mean": -0.5289999999999999,
        "reward_max": 0.4016875000000004,
        "reward_min": -1.5456250000000002,
        "leartime_s": 0.055157010996481404,
        "sampletime": 1.859486700996058,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 624000,
        "reward_mean": -0.35967499999999986,
        "reward_max": 0.8013125000000006,
        "reward_min": -1.9039375,
        "leartime_s": 0.06382337500690483,
        "sampletime": 1.8108692670066375,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 626000,
        "reward_mean": -0.14037499999999986,
        "reward_max": 0.7102500000000005,
        "reward_min": -1.163625,
        "leartime_s": 0.032950250984868035,
        "sampletime": 2.0804309000086505,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 628000,
        "reward_mean": -0.12307499999999984,
        "reward_max": 0.9261875000000005,
        "reward_min": -1.0559375000000002,
        "leartime_s": 0.02498837298480794,
        "sampletime": 1.6741978649806697,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 630000,
        "reward_mean": -0.28149999999999975,
        "reward_max": 0.5378750000000005,
        "reward_min": -1.6870000000000005,
        "leartime_s": 0.01783660100772977,
        "sampletime": 1.7564462810114492,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 632000,
        "reward_mean": -0.3806499999999999,
        "reward_max": 0.6450000000000005,
        "reward_min": -1.6156249999999999,
        "leartime_s": 0.08133732099668123,
        "sampletime": 1.9917353329947218,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 634000,
        "reward_mean": -0.1917499999999998,
        "reward_max": 0.7278750000000003,
        "reward_min": -1.1229375000000004,
        "leartime_s": 0.02786524800467305,
        "sampletime": 1.963213046983583,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 636000,
        "reward_mean": -0.2710499999999999,
        "reward_max": 0.5536250000000004,
        "reward_min": -1.3860000000000003,
        "leartime_s": 0.05402091800351627,
        "sampletime": 1.863962369010551,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 638000,
        "reward_mean": -0.42994999999999983,
        "reward_max": 0.48775000000000046,
        "reward_min": -1.5291250000000003,
        "leartime_s": 0.03030801800196059,
        "sampletime": 2.2282036160177086,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 640000,
        "reward_mean": -0.33514999999999995,
        "reward_max": 0.5608125,
        "reward_min": -1.5849374999999997,
        "leartime_s": 0.026144303992623463,
        "sampletime": 1.7925307909899857,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 642000,
        "reward_mean": -0.585425,
        "reward_max": 0.4037500000000002,
        "reward_min": -2.0432500000000005,
        "leartime_s": 0.033886606979649514,
        "sampletime": 1.9930152900051326,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 644000,
        "reward_mean": -0.4596249999999999,
        "reward_max": 0.5571875000000004,
        "reward_min": -1.9795625000000003,
        "leartime_s": 0.01737783700809814,
        "sampletime": 2.0355333360203076,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 646000,
        "reward_mean": -0.5280750000000001,
        "reward_max": 0.42512500000000014,
        "reward_min": -1.7022499999999996,
        "leartime_s": 0.03237367299152538,
        "sampletime": 1.6365818780031987,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 648000,
        "reward_mean": -0.4775999999999999,
        "reward_max": 0.6445625000000004,
        "reward_min": -1.4640625,
        "leartime_s": 0.021574022015556693,
        "sampletime": 1.6344738070038147,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 650000,
        "reward_mean": -0.26379999999999987,
        "reward_max": 0.6331875000000005,
        "reward_min": -1.3355000000000004,
        "leartime_s": 0.027422942977864295,
        "sampletime": 1.844100788992364,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 652000,
        "reward_mean": -0.5421999999999999,
        "reward_max": 0.39187500000000025,
        "reward_min": -1.6786875000000003,
        "leartime_s": 0.03894215900800191,
        "sampletime": 1.8907672890054528,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 654000,
        "reward_mean": -0.41607499999999986,
        "reward_max": 0.5813750000000005,
        "reward_min": -1.5633750000000006,
        "leartime_s": 0.022647211997536942,
        "sampletime": 1.8583852240117267,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 656000,
        "reward_mean": -0.6510499999999999,
        "reward_max": 0.5045000000000004,
        "reward_min": -1.6906875000000001,
        "leartime_s": 0.019183182012056932,
        "sampletime": 2.229409275983926,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 658000,
        "reward_mean": -0.60815,
        "reward_max": 0.3872500000000006,
        "reward_min": -1.8040625000000006,
        "leartime_s": 0.04954005000763573,
        "sampletime": 1.9457184619968757,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 660000,
        "reward_mean": -0.4767499999999999,
        "reward_max": 0.4433750000000005,
        "reward_min": -1.7390000000000003,
        "leartime_s": 0.022497080004541203,
        "sampletime": 1.784206530021038,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 662000,
        "reward_mean": -0.45129999999999987,
        "reward_max": 0.4451875000000005,
        "reward_min": -1.638375,
        "leartime_s": 0.03904471901478246,
        "sampletime": 1.8235980890167411,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 664000,
        "reward_mean": -0.604375,
        "reward_max": 0.28743750000000035,
        "reward_min": -1.5842500000000004,
        "leartime_s": 0.05066511098993942,
        "sampletime": 1.938707285997225,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 666000,
        "reward_mean": -0.3867749999999999,
        "reward_max": 0.4670000000000002,
        "reward_min": -1.3342500000000002,
        "leartime_s": 0.02311233599903062,
        "sampletime": 2.099816975998692,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 668000,
        "reward_mean": -0.5619999999999998,
        "reward_max": 0.33237500000000036,
        "reward_min": -1.9635624999999997,
        "leartime_s": 0.0545170400000643,
        "sampletime": 1.7810052649874706,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 670000,
        "reward_mean": -0.46882499999999994,
        "reward_max": 0.5650000000000004,
        "reward_min": -1.6055000000000001,
        "leartime_s": 0.04070244400645606,
        "sampletime": 1.8998990949767176,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 672000,
        "reward_mean": -0.5182749999999998,
        "reward_max": 0.36087500000000045,
        "reward_min": -1.8351875000000004,
        "leartime_s": 0.01899764098925516,
        "sampletime": 1.9758254049811512,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 674000,
        "reward_mean": -0.5837,
        "reward_max": 0.5054375000000005,
        "reward_min": -2.120000000000001,
        "leartime_s": 0.05211773901828565,
        "sampletime": 1.9966693739988841,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 676000,
        "reward_mean": -0.3326249999999999,
        "reward_max": 0.8356250000000006,
        "reward_min": -1.4164375,
        "leartime_s": 0.061485718993935734,
        "sampletime": 1.8108634719974361,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 678000,
        "reward_mean": -0.4207999999999999,
        "reward_max": 0.6403125000000003,
        "reward_min": -1.4632500000000002,
        "leartime_s": 0.04507030997774564,
        "sampletime": 1.6517895540164318,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 680000,
        "reward_mean": -0.3945999999999998,
        "reward_max": 0.5522500000000006,
        "reward_min": -1.5817500000000009,
        "leartime_s": 0.033080830005928874,
        "sampletime": 1.7412135529739317,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 682000,
        "reward_mean": -0.5407499999999997,
        "reward_max": 0.46162500000000045,
        "reward_min": -2.0508124999999997,
        "leartime_s": 0.04144244999042712,
        "sampletime": 1.889388762996532,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 684000,
        "reward_mean": -0.2969499999999998,
        "reward_max": 0.7160625000000005,
        "reward_min": -1.5650625,
        "leartime_s": 0.07456280998303555,
        "sampletime": 1.7189024979888927,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 686000,
        "reward_mean": -0.5656749999999999,
        "reward_max": 0.6272500000000005,
        "reward_min": -1.9676250000000006,
        "leartime_s": 0.04719990899320692,
        "sampletime": 2.0839634840085637,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 688000,
        "reward_mean": -0.534225,
        "reward_max": 0.5145000000000002,
        "reward_min": -1.7246875,
        "leartime_s": 0.04863938898779452,
        "sampletime": 2.1202577670046594,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 690000,
        "reward_mean": -0.5004999999999998,
        "reward_max": 0.5700000000000004,
        "reward_min": -1.5160000000000005,
        "leartime_s": 0.019488492020173,
        "sampletime": 1.946476885001175,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 692000,
        "reward_mean": -0.668075,
        "reward_max": 0.16256250000000028,
        "reward_min": -1.6885000000000001,
        "leartime_s": 0.0951160529803019,
        "sampletime": 2.028008595982101,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 694000,
        "reward_mean": -0.779625,
        "reward_max": 0.4364375000000003,
        "reward_min": -2.8416875,
        "leartime_s": 0.022443769994424656,
        "sampletime": 2.124312694009859,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 696000,
        "reward_mean": -0.4645749999999999,
        "reward_max": 0.3539375000000002,
        "reward_min": -1.4079375000000005,
        "leartime_s": 0.0579283150145784,
        "sampletime": 1.7998747079982422,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 698000,
        "reward_mean": -0.5477000000000001,
        "reward_max": 0.5618750000000005,
        "reward_min": -1.8159375000000013,
        "leartime_s": 0.06628605799051002,
        "sampletime": 2.015463785995962,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 700000,
        "reward_mean": -0.5560750000000001,
        "reward_max": 0.3700625000000005,
        "reward_min": -1.6618125000000001,
        "leartime_s": 0.046337603009305894,
        "sampletime": 1.9546487699844874,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 702000,
        "reward_mean": -0.5512249999999999,
        "reward_max": 0.5777500000000003,
        "reward_min": -1.8035000000000005,
        "leartime_s": 0.0455868839926552,
        "sampletime": 1.963183127983939,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 704000,
        "reward_mean": -0.6954000000000001,
        "reward_max": 0.24243750000000033,
        "reward_min": -1.7405624999999998,
        "leartime_s": 0.07603889898746274,
        "sampletime": 2.2134353000146803,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 706000,
        "reward_mean": -0.38339999999999996,
        "reward_max": 0.5576875000000007,
        "reward_min": -1.47575,
        "leartime_s": 0.05019097198965028,
        "sampletime": 1.7598010569927283,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 708000,
        "reward_mean": -0.5919249999999999,
        "reward_max": 0.18062500000000017,
        "reward_min": -1.7756875000000003,
        "leartime_s": 0.02160388301126659,
        "sampletime": 1.9518880789983086,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 710000,
        "reward_mean": -0.7159249999999999,
        "reward_max": 0.1980625000000003,
        "reward_min": -2.0776875,
        "leartime_s": 0.04262304800795391,
        "sampletime": 1.7551214240083937,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 712000,
        "reward_mean": -0.6993999999999999,
        "reward_max": 0.11487500000000023,
        "reward_min": -1.7417500000000008,
        "leartime_s": 0.019476570014376193,
        "sampletime": 1.8702183389978018,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 714000,
        "reward_mean": -0.930825,
        "reward_max": 0.00024999999999991696,
        "reward_min": -2.275312500000001,
        "leartime_s": 0.03907915600575507,
        "sampletime": 1.91517496999586,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 716000,
        "reward_mean": -0.5311999999999999,
        "reward_max": 0.7276875000000003,
        "reward_min": -1.6170000000000007,
        "leartime_s": 0.0843502490024548,
        "sampletime": 1.9517177189991344,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 718000,
        "reward_mean": -0.637025,
        "reward_max": 0.2293125000000003,
        "reward_min": -1.9532500000000002,
        "leartime_s": 0.0651259490114171,
        "sampletime": 2.0815551170089748,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 720000,
        "reward_mean": -0.613175,
        "reward_max": 0.22862500000000002,
        "reward_min": -1.6095625000000005,
        "leartime_s": 0.057221331022446975,
        "sampletime": 1.9339610729948618,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 722000,
        "reward_mean": -0.559125,
        "reward_max": 0.34687500000000043,
        "reward_min": -2.0082500000000003,
        "leartime_s": 0.07223112400970422,
        "sampletime": 1.7658639309811406,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 724000,
        "reward_mean": -0.5826749999999999,
        "reward_max": 0.21737500000000054,
        "reward_min": -1.8470625000000005,
        "leartime_s": 0.03509173300699331,
        "sampletime": 1.9161276480008382,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 726000,
        "reward_mean": -0.486,
        "reward_max": 0.5248750000000002,
        "reward_min": -1.8884374999999998,
        "leartime_s": 0.03234054098720662,
        "sampletime": 2.120617995999055,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 728000,
        "reward_mean": -0.6295999999999999,
        "reward_max": 0.4121250000000003,
        "reward_min": -2.0241250000000006,
        "leartime_s": 0.030680787982419133,
        "sampletime": 1.9185259279911406,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 730000,
        "reward_mean": -0.7011499999999998,
        "reward_max": 0.24906250000000035,
        "reward_min": -1.9086875,
        "leartime_s": 0.035260814998764545,
        "sampletime": 1.7763749640143942,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 732000,
        "reward_mean": -0.8181499999999999,
        "reward_max": 0.023500000000000375,
        "reward_min": -1.9850625000000002,
        "leartime_s": 0.024811726005282253,
        "sampletime": 1.9485522019967902,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 734000,
        "reward_mean": -0.615675,
        "reward_max": 0.3472500000000001,
        "reward_min": -1.547125,
        "leartime_s": 0.02505907800514251,
        "sampletime": 2.1008702169929165,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 736000,
        "reward_mean": -0.55255,
        "reward_max": 0.4786250000000003,
        "reward_min": -1.8965000000000003,
        "leartime_s": 0.0271588169853203,
        "sampletime": 1.6167123609920964,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 738000,
        "reward_mean": -0.7395250000000001,
        "reward_max": 0.32543750000000027,
        "reward_min": -1.9757500000000003,
        "leartime_s": 0.05226612801197916,
        "sampletime": 2.110298154002521,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 740000,
        "reward_mean": -0.86725,
        "reward_max": 0.12075000000000034,
        "reward_min": -2.06875,
        "leartime_s": 0.049074270005803555,
        "sampletime": 1.6197763340023812,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 742000,
        "reward_mean": -0.699375,
        "reward_max": 0.3933750000000005,
        "reward_min": -2.068375,
        "leartime_s": 0.025987396016716957,
        "sampletime": 1.5381159060052596,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 744000,
        "reward_mean": -0.7689250000000001,
        "reward_max": 0.19025000000000034,
        "reward_min": -1.7746249999999997,
        "leartime_s": 0.046718402998521924,
        "sampletime": 2.3852705339959357,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 746000,
        "reward_mean": -0.7967500000000001,
        "reward_max": 0.15762500000000024,
        "reward_min": -2.081187500000001,
        "leartime_s": 0.0319139740022365,
        "sampletime": 1.9577155899896752,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 748000,
        "reward_mean": -0.8883750000000001,
        "reward_max": 0.30368750000000044,
        "reward_min": -2.412250000000001,
        "leartime_s": 0.06405463698320091,
        "sampletime": 1.8692304549913388,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 750000,
        "reward_mean": -0.6863499999999999,
        "reward_max": 0.2913125000000003,
        "reward_min": -2.1327500000000006,
        "leartime_s": 0.03979092399822548,
        "sampletime": 1.943485841009533,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 752000,
        "reward_mean": -0.7561249999999999,
        "reward_max": 0.23193750000000027,
        "reward_min": -2.3202500000000006,
        "leartime_s": 0.05501316100708209,
        "sampletime": 1.7976597899978515,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 754000,
        "reward_mean": -0.6680750000000001,
        "reward_max": 0.3624375000000003,
        "reward_min": -1.9528750000000001,
        "leartime_s": 0.07995899001252837,
        "sampletime": 2.021377955999924,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 756000,
        "reward_mean": -0.804075,
        "reward_max": 0.1716250000000003,
        "reward_min": -2.079625,
        "leartime_s": 0.043274820025544614,
        "sampletime": 2.0250465459830593,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 758000,
        "reward_mean": -0.58205,
        "reward_max": 0.47412500000000035,
        "reward_min": -1.6884375000000007,
        "leartime_s": 0.026032394001958892,
        "sampletime": 1.7803457870031707,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 760000,
        "reward_mean": -0.7836749999999999,
        "reward_max": 0.4768750000000004,
        "reward_min": -1.972312500000001,
        "leartime_s": 0.08623933902708814,
        "sampletime": 2.0365896919975057,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 762000,
        "reward_mean": -0.912375,
        "reward_max": 0.17274999999999996,
        "reward_min": -2.7241250000000004,
        "leartime_s": 0.06927363900467753,
        "sampletime": 2.037871915992582,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 764000,
        "reward_mean": -0.696075,
        "reward_max": 0.18681250000000005,
        "reward_min": -1.8248125000000004,
        "leartime_s": 0.04249449598137289,
        "sampletime": 1.744301380997058,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 766000,
        "reward_mean": -0.7682749999999998,
        "reward_max": 0.2233750000000004,
        "reward_min": -2.2289375000000002,
        "leartime_s": 0.036480476992437616,
        "sampletime": 2.236838867975166,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 768000,
        "reward_mean": -0.5665999999999999,
        "reward_max": 0.5225625000000005,
        "reward_min": -1.600875,
        "leartime_s": 0.05666471199947409,
        "sampletime": 1.972865254007047,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 770000,
        "reward_mean": -0.6102,
        "reward_max": 0.5776875000000005,
        "reward_min": -2.1345000000000005,
        "leartime_s": 0.07991201599361375,
        "sampletime": 1.6331398829934187,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 772000,
        "reward_mean": -0.4350749999999998,
        "reward_max": 0.6630625000000007,
        "reward_min": -1.7634375000000004,
        "leartime_s": 0.058374018990434706,
        "sampletime": 2.086778422992211,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 774000,
        "reward_mean": -0.4856249999999999,
        "reward_max": 0.6483125000000003,
        "reward_min": -1.8122500000000006,
        "leartime_s": 0.026800365012604743,
        "sampletime": 1.6945207999960985,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 776000,
        "reward_mean": -0.4109499999999999,
        "reward_max": 0.44943750000000054,
        "reward_min": -1.6671250000000002,
        "leartime_s": 0.030069289001403376,
        "sampletime": 1.8272837350086775,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 778000,
        "reward_mean": -0.4681249999999999,
        "reward_max": 0.4200625000000002,
        "reward_min": -1.7811875000000006,
        "leartime_s": 0.03860772101324983,
        "sampletime": 1.9631585830065887,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 780000,
        "reward_mean": -0.7916749999999999,
        "reward_max": 0.2815000000000003,
        "reward_min": -1.8538749999999997,
        "leartime_s": 0.02187125402269885,
        "sampletime": 2.3748420200136025,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 782000,
        "reward_mean": -0.46602499999999986,
        "reward_max": 0.5796875000000002,
        "reward_min": -1.7623125000000002,
        "leartime_s": 0.04063124899403192,
        "sampletime": 1.716595670004608,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 784000,
        "reward_mean": -0.5329499999999998,
        "reward_max": 0.42412500000000053,
        "reward_min": -2.4816875000000005,
        "leartime_s": 0.023895427002571523,
        "sampletime": 2.132368239981588,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 786000,
        "reward_mean": -0.5137499999999998,
        "reward_max": 0.4063750000000004,
        "reward_min": -1.7565624999999996,
        "leartime_s": 0.04671599899302237,
        "sampletime": 1.9148990169924218,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 788000,
        "reward_mean": -0.4764249999999999,
        "reward_max": 0.48550000000000054,
        "reward_min": -1.6148125000000004,
        "leartime_s": 0.03150596100022085,
        "sampletime": 1.8182405259867664,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 790000,
        "reward_mean": -0.4427249999999999,
        "reward_max": 0.7323750000000003,
        "reward_min": -1.8905,
        "leartime_s": 0.09125453000888228,
        "sampletime": 1.8369033900089562,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 792000,
        "reward_mean": -0.6284249999999998,
        "reward_max": 0.3440625000000004,
        "reward_min": -2.0576874999999997,
        "leartime_s": 0.04369780397973955,
        "sampletime": 2.3178054580057506,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 794000,
        "reward_mean": -0.7057749999999998,
        "reward_max": 0.24781250000000057,
        "reward_min": -2.3981874999999997,
        "leartime_s": 0.0810102219984401,
        "sampletime": 1.7890601440158207,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 796000,
        "reward_mean": -0.45719999999999983,
        "reward_max": 0.4538125000000006,
        "reward_min": -1.5274375000000007,
        "leartime_s": 0.02591789700090885,
        "sampletime": 2.097553517000051,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 798000,
        "reward_mean": -0.43914999999999976,
        "reward_max": 0.7561875000000005,
        "reward_min": -1.6264374999999998,
        "leartime_s": 0.0528593199851457,
        "sampletime": 2.1500615859986283,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 800000,
        "reward_mean": -0.6142,
        "reward_max": 0.27850000000000014,
        "reward_min": -1.7073750000000003,
        "leartime_s": 0.05322209300356917,
        "sampletime": 1.8063753690221347,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 802000,
        "reward_mean": -0.736775,
        "reward_max": 0.41193750000000023,
        "reward_min": -2.228625000000001,
        "leartime_s": 0.054450261988677084,
        "sampletime": 1.8096267690125387,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 804000,
        "reward_mean": -0.5260499999999999,
        "reward_max": 0.5181250000000004,
        "reward_min": -1.6588125000000002,
        "leartime_s": 0.04923673000303097,
        "sampletime": 1.7342011499858927,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 806000,
        "reward_mean": -0.5113999999999997,
        "reward_max": 0.6163125000000007,
        "reward_min": -1.9772499999999997,
        "leartime_s": 0.031425823020981625,
        "sampletime": 1.7248608980153222,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 808000,
        "reward_mean": -0.6984749999999998,
        "reward_max": 0.35375000000000045,
        "reward_min": -2.1396875,
        "leartime_s": 0.06284802197478712,
        "sampletime": 1.8477259979990777,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 810000,
        "reward_mean": -0.5843499999999999,
        "reward_max": 0.4631250000000004,
        "reward_min": -1.7583125,
        "leartime_s": 0.07049956900300458,
        "sampletime": 1.8144764059979934,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 812000,
        "reward_mean": -0.43339999999999973,
        "reward_max": 0.7599375000000002,
        "reward_min": -2.0305,
        "leartime_s": 0.0691381270007696,
        "sampletime": 1.9804875209811144,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 814000,
        "reward_mean": -0.6237749999999999,
        "reward_max": 0.32000000000000034,
        "reward_min": -2.074937500000001,
        "leartime_s": 0.05258129598223604,
        "sampletime": 1.8851912020181771,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 816000,
        "reward_mean": -0.5450249999999999,
        "reward_max": 0.49581250000000043,
        "reward_min": -2.1114375,
        "leartime_s": 0.050836023001465946,
        "sampletime": 1.886183620983502,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 818000,
        "reward_mean": -0.733425,
        "reward_max": 0.31168750000000056,
        "reward_min": -1.7204375,
        "leartime_s": 0.022770270996261388,
        "sampletime": 1.9763128079939634,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 820000,
        "reward_mean": -0.720875,
        "reward_max": 0.2663750000000005,
        "reward_min": -1.9419375,
        "leartime_s": 0.06889296101871878,
        "sampletime": 1.9973517400212586,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 822000,
        "reward_mean": -0.5181249999999998,
        "reward_max": 0.49456250000000046,
        "reward_min": -2.0992500000000005,
        "leartime_s": 0.02712985299876891,
        "sampletime": 1.656029056000989,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 824000,
        "reward_mean": -0.6357999999999999,
        "reward_max": 0.40581250000000035,
        "reward_min": -1.8116875000000003,
        "leartime_s": 0.060061459022108465,
        "sampletime": 2.4044717760116328,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 826000,
        "reward_mean": -0.6429499999999998,
        "reward_max": 0.29587500000000067,
        "reward_min": -1.7029999999999998,
        "leartime_s": 0.0652258129848633,
        "sampletime": 1.646512032020837,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 828000,
        "reward_mean": -0.4270999999999999,
        "reward_max": 0.7287500000000003,
        "reward_min": -1.7977500000000004,
        "leartime_s": 0.0739174319896847,
        "sampletime": 1.849929310992593,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 830000,
        "reward_mean": -0.7118,
        "reward_max": 0.3013125000000005,
        "reward_min": -1.9058750000000004,
        "leartime_s": 0.027270309015875682,
        "sampletime": 2.113455801998498,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 832000,
        "reward_mean": -0.6560249999999999,
        "reward_max": 0.31975000000000015,
        "reward_min": -1.8073750000000008,
        "leartime_s": 0.05967247500666417,
        "sampletime": 1.8151534509961493,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 834000,
        "reward_mean": -0.35377499999999973,
        "reward_max": 0.7556250000000004,
        "reward_min": -1.6876249999999997,
        "leartime_s": 0.04750042999512516,
        "sampletime": 1.7391500169760548,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 836000,
        "reward_mean": -0.3591999999999998,
        "reward_max": 0.6093750000000006,
        "reward_min": -1.4794375000000002,
        "leartime_s": 0.02898905798792839,
        "sampletime": 1.887243873992702,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 838000,
        "reward_mean": -0.5989249999999999,
        "reward_max": 0.3433750000000005,
        "reward_min": -1.6157500000000002,
        "leartime_s": 0.04283300199313089,
        "sampletime": 1.7207657199760433,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 840000,
        "reward_mean": -0.5968249999999998,
        "reward_max": 0.5071250000000004,
        "reward_min": -1.9601875000000002,
        "leartime_s": 0.023083690990461037,
        "sampletime": 1.8853030290047172,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 842000,
        "reward_mean": -0.7560999999999999,
        "reward_max": 0.3674375000000004,
        "reward_min": -1.9142500000000002,
        "leartime_s": 0.037730609998106956,
        "sampletime": 1.7566543520078994,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 844000,
        "reward_mean": -0.6802999999999997,
        "reward_max": 0.14768750000000028,
        "reward_min": -1.8745000000000005,
        "leartime_s": 0.07435395300853997,
        "sampletime": 1.8960883820254821,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 846000,
        "reward_mean": -0.5159749999999999,
        "reward_max": 0.49868750000000056,
        "reward_min": -1.9721250000000001,
        "leartime_s": 0.07090084700030275,
        "sampletime": 2.0811410660098772,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 848000,
        "reward_mean": -0.32224999999999976,
        "reward_max": 0.6111250000000007,
        "reward_min": -1.3671250000000004,
        "leartime_s": 0.032837873994139954,
        "sampletime": 2.0952187410148326,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 850000,
        "reward_mean": -0.5160749999999997,
        "reward_max": 0.6296875000000006,
        "reward_min": -1.8288750000000003,
        "leartime_s": 0.03831761499168351,
        "sampletime": 1.719422151974868,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 852000,
        "reward_mean": -0.36394999999999983,
        "reward_max": 0.7734375000000006,
        "reward_min": -1.4224375000000002,
        "leartime_s": 0.06493181499536149,
        "sampletime": 2.304654427978676,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 854000,
        "reward_mean": -0.36217499999999986,
        "reward_max": 0.7175625000000003,
        "reward_min": -1.5135,
        "leartime_s": 0.06790723800077103,
        "sampletime": 1.793784659996163,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 856000,
        "reward_mean": -0.6667499999999998,
        "reward_max": 0.4032500000000005,
        "reward_min": -2.0482500000000003,
        "leartime_s": 0.07524548299261369,
        "sampletime": 1.9698545999999624,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 858000,
        "reward_mean": -0.5763749999999999,
        "reward_max": 0.5586875000000004,
        "reward_min": -2.2769375,
        "leartime_s": 0.05742657498922199,
        "sampletime": 1.7904462029982824,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 860000,
        "reward_mean": -0.5571499999999997,
        "reward_max": 0.6108125000000004,
        "reward_min": -2.0510625,
        "leartime_s": 0.056662390008568764,
        "sampletime": 2.0857906820019707,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 862000,
        "reward_mean": -0.26937499999999975,
        "reward_max": 0.7186875000000006,
        "reward_min": -1.2199999999999998,
        "leartime_s": 0.05164507500012405,
        "sampletime": 1.8837445200188085,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 864000,
        "reward_mean": -0.4434749999999998,
        "reward_max": 0.6453125000000005,
        "reward_min": -1.9096875,
        "leartime_s": 0.0608993060013745,
        "sampletime": 1.9719910520070698,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 866000,
        "reward_mean": -0.4033249999999998,
        "reward_max": 0.9381250000000007,
        "reward_min": -1.368,
        "leartime_s": 0.07677038598922081,
        "sampletime": 2.092883276985958,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 868000,
        "reward_mean": -0.12942499999999976,
        "reward_max": 0.8216875000000008,
        "reward_min": -1.2146250000000003,
        "leartime_s": 0.04402077599661425,
        "sampletime": 1.7452713339880574,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 870000,
        "reward_mean": -0.5812749999999999,
        "reward_max": 0.39762500000000034,
        "reward_min": -1.7756875000000005,
        "leartime_s": 0.029651338001713157,
        "sampletime": 1.62080214600428,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 872000,
        "reward_mean": -0.35482499999999983,
        "reward_max": 0.6768125000000003,
        "reward_min": -1.6151875,
        "leartime_s": 0.05329339799936861,
        "sampletime": 1.990924368990818,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 874000,
        "reward_mean": -0.8078249999999998,
        "reward_max": 0.3710625000000005,
        "reward_min": -2.1251875,
        "leartime_s": 0.026969752012519166,
        "sampletime": 1.877095867996104,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 876000,
        "reward_mean": -0.32739999999999975,
        "reward_max": 0.5688750000000007,
        "reward_min": -1.5243749999999998,
        "leartime_s": 0.07507202800479718,
        "sampletime": 1.8922817489947192,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 878000,
        "reward_mean": -0.3252499999999998,
        "reward_max": 0.6098125000000004,
        "reward_min": -1.4642500000000007,
        "leartime_s": 0.023708844993961975,
        "sampletime": 2.1754928620066494,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 880000,
        "reward_mean": -0.5141749999999998,
        "reward_max": 0.6460625000000007,
        "reward_min": -1.642125,
        "leartime_s": 0.047682932985480875,
        "sampletime": 1.668450048979139,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 882000,
        "reward_mean": -0.37729999999999986,
        "reward_max": 0.7645000000000004,
        "reward_min": -1.7835,
        "leartime_s": 0.09529494302114472,
        "sampletime": 2.2009054480004124,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 884000,
        "reward_mean": -0.27602499999999974,
        "reward_max": 0.5834375000000005,
        "reward_min": -1.4881875,
        "leartime_s": 0.049061872996389866,
        "sampletime": 1.941655891976552,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 886000,
        "reward_mean": -0.38107499999999983,
        "reward_max": 0.7978750000000003,
        "reward_min": -1.9925000000000004,
        "leartime_s": 0.031399578001582995,
        "sampletime": 1.6593427959887777,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 888000,
        "reward_mean": -0.6351749999999997,
        "reward_max": 0.5470000000000006,
        "reward_min": -2.0134375,
        "leartime_s": 0.048822680982993916,
        "sampletime": 1.9398682829923928,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 890000,
        "reward_mean": -0.4518499999999998,
        "reward_max": 0.5684375000000005,
        "reward_min": -1.689,
        "leartime_s": 0.01879088400164619,
        "sampletime": 1.9447105030121747,
        "best_mean": -0.10994999999999981,
        "best_max": 0.6905000000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 892000,
        "reward_mean": -0.0031249999999997213,
        "reward_max": 0.9881875000000006,
        "reward_min": -1.1584999999999999,
        "leartime_s": 0.08599733698065393,
        "sampletime": 1.728095922007924,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 894000,
        "reward_mean": -0.1101749999999998,
        "reward_max": 0.9006250000000003,
        "reward_min": -1.7380625,
        "leartime_s": 0.07430825100163929,
        "sampletime": 1.838366148993373,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 896000,
        "reward_mean": -0.22834999999999975,
        "reward_max": 0.9200000000000002,
        "reward_min": -2.0251875000000004,
        "leartime_s": 0.06428908900124952,
        "sampletime": 1.9636568450077903,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 898000,
        "reward_mean": -0.3899999999999999,
        "reward_max": 0.8183125000000004,
        "reward_min": -1.6543125000000003,
        "leartime_s": 0.043354310997528955,
        "sampletime": 1.9742805680143647,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 900000,
        "reward_mean": -0.3173749999999998,
        "reward_max": 0.7787500000000005,
        "reward_min": -1.4311875000000003,
        "leartime_s": 0.04611578898038715,
        "sampletime": 1.6704106090182904,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 902000,
        "reward_mean": -0.27779999999999977,
        "reward_max": 0.7920000000000004,
        "reward_min": -1.615375,
        "leartime_s": 0.06664003801415674,
        "sampletime": 1.6125158079958055,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 904000,
        "reward_mean": -0.0748999999999998,
        "reward_max": 1.0872500000000003,
        "reward_min": -1.1231250000000002,
        "leartime_s": 0.050449595000827685,
        "sampletime": 1.9580670499999542,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 906000,
        "reward_mean": -0.3215749999999997,
        "reward_max": 0.7669374999999999,
        "reward_min": -1.442625,
        "leartime_s": 0.02740958597860299,
        "sampletime": 1.7900214590190444,
        "best_mean": -0.0031249999999997213,
        "best_max": 0.9881875000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 908000,
        "reward_mean": 0.1220500000000003,
        "reward_max": 1.1811875000000003,
        "reward_min": -0.9309999999999999,
        "leartime_s": 0.0774317370087374,
        "sampletime": 1.889275669993367,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 910000,
        "reward_mean": -0.13144999999999982,
        "reward_max": 1.1625000000000003,
        "reward_min": -1.2525000000000004,
        "leartime_s": 0.07137911699828692,
        "sampletime": 2.0575119589921087,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 912000,
        "reward_mean": -0.26787499999999975,
        "reward_max": 0.8811875000000006,
        "reward_min": -1.268375,
        "leartime_s": 0.06047906802268699,
        "sampletime": 1.8031376220169477,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 914000,
        "reward_mean": 0.03972500000000031,
        "reward_max": 1.1487500000000004,
        "reward_min": -1.0138749999999999,
        "leartime_s": 0.06182561899186112,
        "sampletime": 1.9232143700064626,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 916000,
        "reward_mean": 0.06430000000000022,
        "reward_max": 1.0700000000000003,
        "reward_min": -1.1266874999999998,
        "leartime_s": 0.05449631399824284,
        "sampletime": 1.8605259300093167,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 918000,
        "reward_mean": -0.4321749999999998,
        "reward_max": 0.9428750000000005,
        "reward_min": -1.6480000000000004,
        "leartime_s": 0.05863986301119439,
        "sampletime": 1.8868460869998671,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 920000,
        "reward_mean": 0.06777500000000035,
        "reward_max": 1.2021875000000009,
        "reward_min": -1.4764374999999996,
        "leartime_s": 0.036939343000994995,
        "sampletime": 1.8516445989953354,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 922000,
        "reward_mean": -0.20192499999999977,
        "reward_max": 0.8276250000000004,
        "reward_min": -1.3874999999999997,
        "leartime_s": 0.10612763298559003,
        "sampletime": 1.6882932190201245,
        "best_mean": 0.1220500000000003,
        "best_max": 1.1811875000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 924000,
        "reward_mean": 0.2603250000000002,
        "reward_max": 1.1615625000000003,
        "reward_min": -1.1693750000000003,
        "leartime_s": 0.06231930298963562,
        "sampletime": 2.2402218950155657,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 926000,
        "reward_mean": -0.1394999999999997,
        "reward_max": 0.8992500000000004,
        "reward_min": -1.6454374999999999,
        "leartime_s": 0.07646506899618544,
        "sampletime": 1.9257961539842654,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 928000,
        "reward_mean": -0.3487249999999998,
        "reward_max": 0.7888125000000001,
        "reward_min": -1.6282499999999995,
        "leartime_s": 0.10666140299872495,
        "sampletime": 1.9035171169962268,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 930000,
        "reward_mean": -0.13074999999999984,
        "reward_max": 0.9870000000000002,
        "reward_min": -1.6512499999999997,
        "leartime_s": 0.03572964298655279,
        "sampletime": 1.9102186620002612,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 932000,
        "reward_mean": -0.3525249999999998,
        "reward_max": 0.8265000000000006,
        "reward_min": -1.7811249999999998,
        "leartime_s": 0.03552021199720912,
        "sampletime": 1.7142297750106081,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 934000,
        "reward_mean": 0.1824000000000004,
        "reward_max": 1.1100625000000008,
        "reward_min": -1.0025624999999998,
        "leartime_s": 0.05113574001006782,
        "sampletime": 1.6612631840107497,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 936000,
        "reward_mean": 0.19070000000000029,
        "reward_max": 1.1245000000000003,
        "reward_min": -0.8931874999999998,
        "leartime_s": 0.024803539999993518,
        "sampletime": 2.277243311982602,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 938000,
        "reward_mean": -0.2878749999999998,
        "reward_max": 0.8100625,
        "reward_min": -1.7763749999999998,
        "leartime_s": 0.045600915007526055,
        "sampletime": 2.0957918200001586,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 940000,
        "reward_mean": 0.003825000000000269,
        "reward_max": 0.9883125000000005,
        "reward_min": -1.190375,
        "leartime_s": 0.07827888400061056,
        "sampletime": 1.6626880149997305,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 942000,
        "reward_mean": 0.18987500000000027,
        "reward_max": 1.1238750000000002,
        "reward_min": -1.3974374999999999,
        "leartime_s": 0.03913964898674749,
        "sampletime": 1.8911532970087137,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 944000,
        "reward_mean": 0.11980000000000021,
        "reward_max": 1.2357500000000001,
        "reward_min": -1.0163124999999997,
        "leartime_s": 0.06472253199899569,
        "sampletime": 1.9724405710003339,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 946000,
        "reward_mean": -0.0852749999999997,
        "reward_max": 0.9555000000000002,
        "reward_min": -0.8893749999999998,
        "leartime_s": 0.053363765007816255,
        "sampletime": 1.8421253990090918,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 948000,
        "reward_mean": 0.004400000000000233,
        "reward_max": 1.0960000000000003,
        "reward_min": -1.2038124999999997,
        "leartime_s": 0.03224794499692507,
        "sampletime": 2.442085121991113,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 950000,
        "reward_mean": 0.12725000000000034,
        "reward_max": 1.0643750000000003,
        "reward_min": -1.279625,
        "leartime_s": 0.061889919015811756,
        "sampletime": 1.843987019994529,
        "best_mean": 0.2603250000000002,
        "best_max": 1.1615625000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 952000,
        "reward_mean": 0.3301750000000003,
        "reward_max": 1.2268750000000002,
        "reward_min": -0.7102499999999997,
        "leartime_s": 0.04103954500169493,
        "sampletime": 1.9550344479794148,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 954000,
        "reward_mean": 0.16630000000000017,
        "reward_max": 1.5111875000000003,
        "reward_min": -0.95975,
        "leartime_s": 0.06674991399631836,
        "sampletime": 1.8400345839909278,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 956000,
        "reward_mean": 0.03275000000000023,
        "reward_max": 1.0268125000000006,
        "reward_min": -1.433875,
        "leartime_s": 0.035887355013983324,
        "sampletime": 1.7654466849926393,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 958000,
        "reward_mean": 0.027125000000000232,
        "reward_max": 1.1048125000000004,
        "reward_min": -1.5083750000000005,
        "leartime_s": 0.035285360005218536,
        "sampletime": 1.8590269310225267,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 960000,
        "reward_mean": 0.09780000000000025,
        "reward_max": 0.8744375000000003,
        "reward_min": -1.321875,
        "leartime_s": 0.052152368996758014,
        "sampletime": 1.8821617909998167,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 962000,
        "reward_mean": 0.05725000000000024,
        "reward_max": 1.1375625000000003,
        "reward_min": -1.0538125000000003,
        "leartime_s": 0.04021087600267492,
        "sampletime": 1.9611881370074116,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 964000,
        "reward_mean": -0.2794256499999998,
        "reward_max": 0.6558125000000001,
        "reward_min": -1.4483125,
        "leartime_s": 0.09333702299045399,
        "sampletime": 1.8041402449889574,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 966000,
        "reward_mean": 0.1040500000000003,
        "reward_max": 1.4250000000000005,
        "reward_min": -1.1839374999999999,
        "leartime_s": 0.02596069301944226,
        "sampletime": 1.6027082929795142,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 968000,
        "reward_mean": -0.061499999999999756,
        "reward_max": 1.1936875000000007,
        "reward_min": -1.471375,
        "leartime_s": 0.05564161701477133,
        "sampletime": 2.0787700560176745,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 970000,
        "reward_mean": 0.08517500000000026,
        "reward_max": 0.9681875000000005,
        "reward_min": -1.0838124999999998,
        "leartime_s": 0.08269574600853957,
        "sampletime": 1.766740713006584,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 972000,
        "reward_mean": 0.24892500000000028,
        "reward_max": 1.2847500000000003,
        "reward_min": -1.1670625000000001,
        "leartime_s": 0.04759783099871129,
        "sampletime": 2.169640325009823,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 974000,
        "reward_mean": -0.0238249999999998,
        "reward_max": 1.1084375000000002,
        "reward_min": -1.1700000000000004,
        "leartime_s": 0.05438384698936716,
        "sampletime": 2.0022980829817243,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 976000,
        "reward_mean": 0.2552000000000002,
        "reward_max": 1.1138125000000003,
        "reward_min": -1.5440625000000003,
        "leartime_s": 0.06521706201601774,
        "sampletime": 1.7643646369979251,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 978000,
        "reward_mean": 0.005675000000000225,
        "reward_max": 1.139875,
        "reward_min": -1.2887499999999996,
        "leartime_s": 0.039719903987133875,
        "sampletime": 2.1483013039978687,
        "best_mean": 0.3301750000000003,
        "best_max": 1.2268750000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 980000,
        "reward_mean": 0.3974000000000003,
        "reward_max": 1.6430625000000005,
        "reward_min": -1.0006249999999999,
        "leartime_s": 0.05576310498872772,
        "sampletime": 1.8307634020166006,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 982000,
        "reward_mean": 0.21270000000000028,
        "reward_max": 1.3875625,
        "reward_min": -0.8671875000000001,
        "leartime_s": 0.09370953601319343,
        "sampletime": 1.955872456979705,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 984000,
        "reward_mean": 0.06967500000000024,
        "reward_max": 1.2329375000000002,
        "reward_min": -1.1047499999999997,
        "leartime_s": 0.026863295992370695,
        "sampletime": 1.8258485909900628,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 986000,
        "reward_mean": 0.2108000000000003,
        "reward_max": 1.2157500000000003,
        "reward_min": -1.0070625,
        "leartime_s": 0.034591539995744824,
        "sampletime": 1.8822777509922162,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 988000,
        "reward_mean": 0.16040000000000026,
        "reward_max": 1.1915625000000007,
        "reward_min": -1.3125000000000002,
        "leartime_s": 0.07432919699931517,
        "sampletime": 1.733288655988872,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 990000,
        "reward_mean": -0.05854999999999974,
        "reward_max": 0.8420000000000003,
        "reward_min": -1.3601874999999999,
        "leartime_s": 0.059744330996181816,
        "sampletime": 1.813563161995262,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 992000,
        "reward_mean": 0.056700000000000216,
        "reward_max": 1.2206875000000004,
        "reward_min": -1.1338125000000001,
        "leartime_s": 0.023937171994475648,
        "sampletime": 1.7836194369883742,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 994000,
        "reward_mean": 0.05607500000000031,
        "reward_max": 1.0041875000000005,
        "reward_min": -1.4574374999999997,
        "leartime_s": 0.03571706201182678,
        "sampletime": 2.0779844550124835,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 996000,
        "reward_mean": 0.12335000000000021,
        "reward_max": 1.3351250000000006,
        "reward_min": -1.1996875000000002,
        "leartime_s": 0.06631380200269632,
        "sampletime": 1.816084215999581,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 998000,
        "reward_mean": -0.1944249999999998,
        "reward_max": 0.6487500000000004,
        "reward_min": -1.4013124999999995,
        "leartime_s": 0.031120086001465097,
        "sampletime": 1.7111276949872263,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 1000000,
        "reward_mean": 0.08830000000000031,
        "reward_max": 1.2696875000000003,
        "reward_min": -1.325875,
        "leartime_s": 0.042036864993860945,
        "sampletime": 1.791120724985376,
        "best_mean": 0.3974000000000003,
        "best_max": 1.6430625000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 1,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]