[
    {
        "generation": 1,
        "timesteps": 2000,
        "reward_mean": -39.115275,
        "reward_max": -9.258375,
        "reward_min": -84.22968750000004,
        "leartime_s": 0.028569740999955684,
        "sampletime": 1.523932779993629,
        "best_mean": -39.115275,
        "best_max": -9.258375,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 4000,
        "reward_mean": -39.009699999999995,
        "reward_max": -1.3338124999999996,
        "reward_min": -74.85537499999998,
        "leartime_s": 0.011601133010117337,
        "sampletime": 1.8672801310021896,
        "best_mean": -39.009699999999995,
        "best_max": -1.3338124999999996,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 6000,
        "reward_mean": -35.026075000000006,
        "reward_max": -1.9019999999999988,
        "reward_min": -198.31818750000005,
        "leartime_s": 0.00696630499442108,
        "sampletime": 1.8647591369808652,
        "best_mean": -35.026075000000006,
        "best_max": -1.9019999999999988,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 8000,
        "reward_mean": -19.421449999999997,
        "reward_max": 0.01674999999999991,
        "reward_min": -190.85881250000003,
        "leartime_s": 0.01070123800309375,
        "sampletime": 1.709578333015088,
        "best_mean": -19.421449999999997,
        "best_max": 0.01674999999999991,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 10000,
        "reward_mean": -9.359675,
        "reward_max": -1.3089374999999999,
        "reward_min": -53.8844375,
        "leartime_s": 0.008026416006032377,
        "sampletime": 1.7425592159852386,
        "best_mean": -9.359675,
        "best_max": -1.3089374999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 12000,
        "reward_mean": -5.6736,
        "reward_max": -1.8271875,
        "reward_min": -15.704937500000002,
        "leartime_s": 0.0045641770120710135,
        "sampletime": 1.7094059810042381,
        "best_mean": -5.6736,
        "best_max": -1.8271875,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 14000,
        "reward_mean": -3.0267000000000004,
        "reward_max": 0.27200000000000024,
        "reward_min": -12.3595625,
        "leartime_s": 0.0101004829921294,
        "sampletime": 1.545871588983573,
        "best_mean": -3.0267000000000004,
        "best_max": 0.27200000000000024,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 16000,
        "reward_mean": -2.2456250000000004,
        "reward_max": 0.5289375000000004,
        "reward_min": -8.1294375,
        "leartime_s": 0.014424644003156573,
        "sampletime": 1.5722509330080356,
        "best_mean": -2.2456250000000004,
        "best_max": 0.5289375000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 18000,
        "reward_mean": -1.9015500000000005,
        "reward_max": -0.37068750000000017,
        "reward_min": -3.90925,
        "leartime_s": 0.029027084994595498,
        "sampletime": 1.680930984992301,
        "best_mean": -1.9015500000000005,
        "best_max": -0.37068750000000017,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 20000,
        "reward_mean": -2.2230000000000003,
        "reward_max": -0.9626875,
        "reward_min": -4.376687500000001,
        "leartime_s": 0.005638706003082916,
        "sampletime": 2.234959802008234,
        "best_mean": -1.9015500000000005,
        "best_max": -0.37068750000000017,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 22000,
        "reward_mean": -2.1455499999999996,
        "reward_max": -0.6604999999999999,
        "reward_min": -3.9305624999999993,
        "leartime_s": 0.03034238499822095,
        "sampletime": 1.8461773250019178,
        "best_mean": -1.9015500000000005,
        "best_max": -0.37068750000000017,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 24000,
        "reward_mean": -1.8363750000000003,
        "reward_max": -0.7743749999999999,
        "reward_min": -3.4947500000000002,
        "leartime_s": 0.015943478007102385,
        "sampletime": 2.1122712999931537,
        "best_mean": -1.8363750000000003,
        "best_max": -0.7743749999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 26000,
        "reward_mean": -1.7104000000000001,
        "reward_max": -0.7315625000000001,
        "reward_min": -3.679312499999999,
        "leartime_s": 0.02657624499988742,
        "sampletime": 2.05559292100952,
        "best_mean": -1.7104000000000001,
        "best_max": -0.7315625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 28000,
        "reward_mean": -1.8407,
        "reward_max": -0.5935000000000001,
        "reward_min": -3.539625000000001,
        "leartime_s": 0.005980860005365685,
        "sampletime": 1.8177095589926466,
        "best_mean": -1.7104000000000001,
        "best_max": -0.7315625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 30000,
        "reward_mean": -1.95595,
        "reward_max": -0.6123125000000001,
        "reward_min": -3.3100625,
        "leartime_s": 0.023323859000811353,
        "sampletime": 2.1350798450002912,
        "best_mean": -1.7104000000000001,
        "best_max": -0.7315625000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 32000,
        "reward_mean": -1.7030249999999998,
        "reward_max": -0.5201250000000004,
        "reward_min": -3.1265625,
        "leartime_s": 0.013401659991359338,
        "sampletime": 2.035690605000127,
        "best_mean": -1.7030249999999998,
        "best_max": -0.5201250000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 34000,
        "reward_mean": -1.6825000000000003,
        "reward_max": -0.6440624999999999,
        "reward_min": -3.0002500000000003,
        "leartime_s": 0.012503779988037422,
        "sampletime": 1.7966281360131688,
        "best_mean": -1.6825000000000003,
        "best_max": -0.6440624999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 36000,
        "reward_mean": -1.6481,
        "reward_max": -0.7126874999999999,
        "reward_min": -3.230875,
        "leartime_s": 0.024337915994692594,
        "sampletime": 2.063894877996063,
        "best_mean": -1.6481,
        "best_max": -0.7126874999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 38000,
        "reward_mean": -1.5057250000000002,
        "reward_max": -0.4842499999999999,
        "reward_min": -2.7220000000000004,
        "leartime_s": 0.013336667994735762,
        "sampletime": 2.138729350990616,
        "best_mean": -1.5057250000000002,
        "best_max": -0.4842499999999999,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 40000,
        "reward_mean": -1.351675,
        "reward_max": -0.36006249999999984,
        "reward_min": -2.6504375,
        "leartime_s": 0.03214375601965003,
        "sampletime": 2.015773419989273,
        "best_mean": -1.351675,
        "best_max": -0.36006249999999984,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 42000,
        "reward_mean": -1.5885,
        "reward_max": -0.5895625000000002,
        "reward_min": -2.7926875,
        "leartime_s": 0.0063720700272824615,
        "sampletime": 2.0135144859959837,
        "best_mean": -1.351675,
        "best_max": -0.36006249999999984,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 44000,
        "reward_mean": -1.6205369404761905,
        "reward_max": -0.7559375000000002,
        "reward_min": -2.5096875,
        "leartime_s": 0.02027417198405601,
        "sampletime": 1.9141287879901938,
        "best_mean": -1.351675,
        "best_max": -0.36006249999999984,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 46000,
        "reward_mean": -1.21505,
        "reward_max": -0.041249999999999815,
        "reward_min": -2.395625000000001,
        "leartime_s": 0.007803473999956623,
        "sampletime": 1.707153142982861,
        "best_mean": -1.21505,
        "best_max": -0.041249999999999815,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 48000,
        "reward_mean": -1.3170000000000002,
        "reward_max": -0.3835000000000002,
        "reward_min": -2.413312500000001,
        "leartime_s": 0.01920860802056268,
        "sampletime": 1.6504364180145785,
        "best_mean": -1.21505,
        "best_max": -0.041249999999999815,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 50000,
        "reward_mean": -1.3216750000000002,
        "reward_max": -0.37606249999999986,
        "reward_min": -2.6355625000000007,
        "leartime_s": 0.005238482001004741,
        "sampletime": 1.8959408449882176,
        "best_mean": -1.21505,
        "best_max": -0.041249999999999815,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 52000,
        "reward_mean": -1.5996750000000002,
        "reward_max": -0.638125,
        "reward_min": -3.0278125000000005,
        "leartime_s": 0.025289451994467527,
        "sampletime": 2.164695273997495,
        "best_mean": -1.21505,
        "best_max": -0.041249999999999815,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 54000,
        "reward_mean": -1.17925,
        "reward_max": -0.07431249999999995,
        "reward_min": -2.4230625000000003,
        "leartime_s": 0.017112150992034003,
        "sampletime": 1.7461431940027978,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 56000,
        "reward_mean": -1.4343500000000002,
        "reward_max": -0.23418749999999997,
        "reward_min": -2.6833750000000007,
        "leartime_s": 0.015349432011134923,
        "sampletime": 1.9381294420163613,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 58000,
        "reward_mean": -1.3878750000000002,
        "reward_max": -0.3023125000000001,
        "reward_min": -2.6065625000000003,
        "leartime_s": 0.018991411983733997,
        "sampletime": 2.1737730620079674,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 60000,
        "reward_mean": -1.48015,
        "reward_max": -0.4838750000000003,
        "reward_min": -2.5523749999999996,
        "leartime_s": 0.04016213500290178,
        "sampletime": 1.6953152710048016,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 62000,
        "reward_mean": -1.3746,
        "reward_max": -0.2829375000000001,
        "reward_min": -2.3558750000000006,
        "leartime_s": 0.01650962099665776,
        "sampletime": 1.9229469129932113,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 64000,
        "reward_mean": -1.3368749999999998,
        "reward_max": -0.3751874999999996,
        "reward_min": -2.5071874999999997,
        "leartime_s": 0.010555754997767508,
        "sampletime": 1.8816151590144727,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 66000,
        "reward_mean": -1.225125,
        "reward_max": -0.26218749999999985,
        "reward_min": -2.9158750000000007,
        "leartime_s": 0.015478852990781888,
        "sampletime": 2.0697221790032927,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 68000,
        "reward_mean": -1.351375,
        "reward_max": -0.3239374999999999,
        "reward_min": -2.8097499999999993,
        "leartime_s": 0.01514295200468041,
        "sampletime": 1.9677198189892806,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 70000,
        "reward_mean": -1.49815,
        "reward_max": -0.7482500000000003,
        "reward_min": -2.9867500000000007,
        "leartime_s": 0.011819134990219027,
        "sampletime": 2.106478921021335,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 72000,
        "reward_mean": -1.3302500000000002,
        "reward_max": -0.24974999999999972,
        "reward_min": -2.5248750000000006,
        "leartime_s": 0.021139438991667703,
        "sampletime": 2.0031497789896093,
        "best_mean": -1.17925,
        "best_max": -0.07431249999999995,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 74000,
        "reward_mean": -1.152825,
        "reward_max": -0.0771250000000002,
        "reward_min": -2.427625000000001,
        "leartime_s": 0.0071210880123544484,
        "sampletime": 1.8504002279951237,
        "best_mean": -1.152825,
        "best_max": -0.0771250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 76000,
        "reward_mean": -1.2522000000000002,
        "reward_max": -0.20793750000000005,
        "reward_min": -2.4378125,
        "leartime_s": 0.021552874997723848,
        "sampletime": 1.977105867001228,
        "best_mean": -1.152825,
        "best_max": -0.0771250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 78000,
        "reward_mean": -1.2278000000000002,
        "reward_max": -0.33706249999999993,
        "reward_min": -2.6758750000000004,
        "leartime_s": 0.019568295974750072,
        "sampletime": 1.797239288018318,
        "best_mean": -1.152825,
        "best_max": -0.0771250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 80000,
        "reward_mean": -1.4422000000000001,
        "reward_max": -0.29856249999999995,
        "reward_min": -2.5902500000000006,
        "leartime_s": 0.020936317974701524,
        "sampletime": 1.795503715024097,
        "best_mean": -1.152825,
        "best_max": -0.0771250000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 82000,
        "reward_mean": -1.1093750000000002,
        "reward_max": -0.23987499999999987,
        "reward_min": -2.4741875,
        "leartime_s": 0.03380304199527018,
        "sampletime": 2.1229477930173744,
        "best_mean": -1.1093750000000002,
        "best_max": -0.23987499999999987,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 84000,
        "reward_mean": -1.0929749999999998,
        "reward_max": 0.04793750000000027,
        "reward_min": -2.426125,
        "leartime_s": 0.00664471200434491,
        "sampletime": 2.0950209200091194,
        "best_mean": -1.0929749999999998,
        "best_max": 0.04793750000000027,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 86000,
        "reward_mean": -1.2277500000000001,
        "reward_max": -0.3183125,
        "reward_min": -2.7726250000000006,
        "leartime_s": 0.020611245010513812,
        "sampletime": 1.7470763099845499,
        "best_mean": -1.0929749999999998,
        "best_max": 0.04793750000000027,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 88000,
        "reward_mean": -1.352025,
        "reward_max": -0.26050000000000006,
        "reward_min": -3.0081875,
        "leartime_s": 0.00963961801608093,
        "sampletime": 2.0194903970113955,
        "best_mean": -1.0929749999999998,
        "best_max": 0.04793750000000027,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 90000,
        "reward_mean": -1.3155500000000002,
        "reward_max": -0.4535624999999998,
        "reward_min": -2.7062500000000003,
        "leartime_s": 0.034977402014192194,
        "sampletime": 2.058310808002716,
        "best_mean": -1.0929749999999998,
        "best_max": 0.04793750000000027,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 92000,
        "reward_mean": -1.1427,
        "reward_max": -0.29231249999999986,
        "reward_min": -2.1005000000000003,
        "leartime_s": 0.006057897990103811,
        "sampletime": 1.8716634379816242,
        "best_mean": -1.0929749999999998,
        "best_max": 0.04793750000000027,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 94000,
        "reward_mean": -1.0086000000000002,
        "reward_max": -0.1496874999999998,
        "reward_min": -2.156,
        "leartime_s": 0.0342096539970953,
        "sampletime": 2.0506794339744374,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 96000,
        "reward_mean": -1.1454000000000002,
        "reward_max": -0.3095,
        "reward_min": -2.567437500000001,
        "leartime_s": 0.006438979995436966,
        "sampletime": 1.8912397230160423,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 98000,
        "reward_mean": -1.5481000000000003,
        "reward_max": -0.6317500000000004,
        "reward_min": -2.4901875,
        "leartime_s": 0.014783577003981918,
        "sampletime": 1.9973502510110848,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 100000,
        "reward_mean": -1.2218000000000002,
        "reward_max": -0.15693749999999987,
        "reward_min": -2.636687500000001,
        "leartime_s": 0.008238787006121129,
        "sampletime": 1.7136841950123198,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 102000,
        "reward_mean": -1.3374750000000002,
        "reward_max": -0.057249999999999954,
        "reward_min": -3.0060625000000005,
        "leartime_s": 0.006438800017349422,
        "sampletime": 2.0397062089759856,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 104000,
        "reward_mean": -1.1998250000000004,
        "reward_max": -0.33368749999999997,
        "reward_min": -2.6960000000000006,
        "leartime_s": 0.015998287010006607,
        "sampletime": 1.986302990000695,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 106000,
        "reward_mean": -1.065725,
        "reward_max": -0.26893749999999983,
        "reward_min": -2.096437500000001,
        "leartime_s": 0.04241210001055151,
        "sampletime": 1.9230066380114295,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 108000,
        "reward_mean": -1.3803,
        "reward_max": -0.4882500000000006,
        "reward_min": -2.45325,
        "leartime_s": 0.014621361013269052,
        "sampletime": 2.125192400009837,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 110000,
        "reward_mean": -1.15785,
        "reward_max": -0.10399999999999979,
        "reward_min": -2.391875000000001,
        "leartime_s": 0.059999712015269324,
        "sampletime": 1.7227374969806988,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 112000,
        "reward_mean": -1.2156750000000003,
        "reward_max": -0.34862499999999996,
        "reward_min": -2.2389375000000005,
        "leartime_s": 0.006998146011028439,
        "sampletime": 1.7423851450148504,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 114000,
        "reward_mean": -1.2642250000000004,
        "reward_max": -0.23000000000000004,
        "reward_min": -2.369875,
        "leartime_s": 0.023077644989825785,
        "sampletime": 2.0072758800233714,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 116000,
        "reward_mean": -1.190375,
        "reward_max": -0.22399999999999973,
        "reward_min": -3.306312500000001,
        "leartime_s": 0.020981237990781665,
        "sampletime": 2.28739279700676,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 118000,
        "reward_mean": -1.2025500000000002,
        "reward_max": -0.3205625,
        "reward_min": -2.4268750000000003,
        "leartime_s": 0.026666142017347738,
        "sampletime": 2.0866194249829277,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 120000,
        "reward_mean": -1.30525,
        "reward_max": -0.4287500000000003,
        "reward_min": -2.61025,
        "leartime_s": 0.007638901995960623,
        "sampletime": 1.949782823008718,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 122000,
        "reward_mean": -1.2978750000000006,
        "reward_max": -0.235375,
        "reward_min": -2.485000000000001,
        "leartime_s": 0.05121155100641772,
        "sampletime": 1.9146809100056998,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 124000,
        "reward_mean": -1.1504750000000001,
        "reward_max": -0.12562499999999974,
        "reward_min": -2.1580625000000007,
        "leartime_s": 0.008943974011344835,
        "sampletime": 1.8218967839784455,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 126000,
        "reward_mean": -1.2367750000000002,
        "reward_max": -0.23093749999999985,
        "reward_min": -2.74275,
        "leartime_s": 0.06284775299718603,
        "sampletime": 1.9254442319797818,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 128000,
        "reward_mean": -1.1607500000000002,
        "reward_max": -0.2834374999999998,
        "reward_min": -2.3359375000000004,
        "leartime_s": 0.016722457978175953,
        "sampletime": 2.2170822600019164,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 130000,
        "reward_mean": -1.296875,
        "reward_max": -0.3651250000000001,
        "reward_min": -2.3541875000000005,
        "leartime_s": 0.03443792701000348,
        "sampletime": 1.8112022929999512,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 132000,
        "reward_mean": -1.2184750000000004,
        "reward_max": -0.171,
        "reward_min": -2.118625,
        "leartime_s": 0.007970384991494939,
        "sampletime": 2.0635667300084606,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 134000,
        "reward_mean": -1.2380750000000003,
        "reward_max": -0.41937500000000005,
        "reward_min": -2.5494375,
        "leartime_s": 0.00812486300128512,
        "sampletime": 1.9264435560035054,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 136000,
        "reward_mean": -1.2579500000000003,
        "reward_max": -0.17062500000000003,
        "reward_min": -2.2971250000000007,
        "leartime_s": 0.008587789023295045,
        "sampletime": 1.9917100989841856,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 138000,
        "reward_mean": -1.1344750000000003,
        "reward_max": -0.09956250000000025,
        "reward_min": -2.4128125000000007,
        "leartime_s": 0.059142243990208954,
        "sampletime": 1.845174470974598,
        "best_mean": -1.0086000000000002,
        "best_max": -0.1496874999999998,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 140000,
        "reward_mean": -0.9950750000000002,
        "reward_max": 0.1385625000000002,
        "reward_min": -2.079500000000001,
        "leartime_s": 0.04408823398989625,
        "sampletime": 1.9816163750074338,
        "best_mean": -0.9950750000000002,
        "best_max": 0.1385625000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 142000,
        "reward_mean": -1.1199250000000003,
        "reward_max": -0.24218749999999992,
        "reward_min": -2.1895000000000002,
        "leartime_s": 0.010830826009623706,
        "sampletime": 1.672177644999465,
        "best_mean": -0.9950750000000002,
        "best_max": 0.1385625000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 144000,
        "reward_mean": -1.1494750000000005,
        "reward_max": -0.03487499999999986,
        "reward_min": -2.405625,
        "leartime_s": 0.02024059198447503,
        "sampletime": 1.8896692559937946,
        "best_mean": -0.9950750000000002,
        "best_max": 0.1385625000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 146000,
        "reward_mean": -0.8428000000000002,
        "reward_max": 0.014812500000000062,
        "reward_min": -1.9362500000000005,
        "leartime_s": 0.02352847799193114,
        "sampletime": 1.8033236819901504,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 148000,
        "reward_mean": -1.1120500000000002,
        "reward_max": -0.11199999999999986,
        "reward_min": -2.4140625000000004,
        "leartime_s": 0.01657331400201656,
        "sampletime": 2.2145567940024193,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 150000,
        "reward_mean": -1.2794250000000005,
        "reward_max": -0.1781874999999999,
        "reward_min": -2.6001875,
        "leartime_s": 0.009185313014313579,
        "sampletime": 1.7800721249950584,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 152000,
        "reward_mean": -1.089425,
        "reward_max": -0.25631250000000005,
        "reward_min": -2.179875000000001,
        "leartime_s": 0.04652496299240738,
        "sampletime": 2.0607345390017144,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 154000,
        "reward_mean": -0.9987250000000001,
        "reward_max": -0.07756250000000015,
        "reward_min": -2.1848750000000012,
        "leartime_s": 0.02304530399851501,
        "sampletime": 2.090121574990917,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 156000,
        "reward_mean": -1.1169250000000004,
        "reward_max": 0.16562500000000024,
        "reward_min": -2.2383750000000004,
        "leartime_s": 0.052010068990057334,
        "sampletime": 1.700220228987746,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 158000,
        "reward_mean": -1.1394000000000002,
        "reward_max": -0.04056249999999993,
        "reward_min": -2.1383125000000005,
        "leartime_s": 0.030273779993876815,
        "sampletime": 1.9540148329979274,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 160000,
        "reward_mean": -1.1599000000000004,
        "reward_max": -0.06499999999999996,
        "reward_min": -2.325062500000001,
        "leartime_s": 0.018222896003862843,
        "sampletime": 2.330128883011639,
        "best_mean": -0.8428000000000002,
        "best_max": 0.014812500000000062,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 162000,
        "reward_mean": -0.8138000000000002,
        "reward_max": 0.1943125000000001,
        "reward_min": -2.4435625000000005,
        "leartime_s": 0.037742711981991306,
        "sampletime": 1.7964177250105422,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 164000,
        "reward_mean": -1.0951500000000003,
        "reward_max": -0.1395625000000001,
        "reward_min": -2.6609375000000006,
        "leartime_s": 0.011877545999595895,
        "sampletime": 1.8188991959905252,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 166000,
        "reward_mean": -1.0792250000000003,
        "reward_max": -0.2834374999999999,
        "reward_min": -2.1526249999999996,
        "leartime_s": 0.02548080400447361,
        "sampletime": 2.0434721919882577,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 168000,
        "reward_mean": -1.0940750000000004,
        "reward_max": -0.16856250000000017,
        "reward_min": -2.2470000000000008,
        "leartime_s": 0.011872275004861876,
        "sampletime": 1.8525395909964573,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 170000,
        "reward_mean": -1.0037750000000005,
        "reward_max": -0.13312500000000005,
        "reward_min": -2.247687500000001,
        "leartime_s": 0.018937752000056207,
        "sampletime": 2.1143771180068143,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 172000,
        "reward_mean": -1.1580750000000002,
        "reward_max": -0.09306250000000013,
        "reward_min": -2.3169375000000008,
        "leartime_s": 0.019513066014042124,
        "sampletime": 2.1272269090113696,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 174000,
        "reward_mean": -0.8367000000000002,
        "reward_max": 0.29281250000000025,
        "reward_min": -2.022187500000001,
        "leartime_s": 0.030346530984388664,
        "sampletime": 1.8286444100085646,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 176000,
        "reward_mean": -0.9934750000000002,
        "reward_max": 0.23937500000000017,
        "reward_min": -2.3998125000000003,
        "leartime_s": 0.024860939010977745,
        "sampletime": 1.690479729004437,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 178000,
        "reward_mean": -1.0089250000000003,
        "reward_max": -0.0994375000000001,
        "reward_min": -1.9065000000000005,
        "leartime_s": 0.012130617018556222,
        "sampletime": 1.9930692790076137,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 180000,
        "reward_mean": -1.0137250000000002,
        "reward_max": 0.09200000000000022,
        "reward_min": -2.343,
        "leartime_s": 0.0075936520006507635,
        "sampletime": 2.021561808011029,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 182000,
        "reward_mean": -0.9801500000000003,
        "reward_max": -0.11631250000000022,
        "reward_min": -2.0726875000000007,
        "leartime_s": 0.02518796199001372,
        "sampletime": 1.7702553549897857,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 184000,
        "reward_mean": -1.1111500000000003,
        "reward_max": -0.007874999999999684,
        "reward_min": -2.2666250000000003,
        "leartime_s": 0.007975004991749302,
        "sampletime": 1.9944803979888093,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 186000,
        "reward_mean": -1.1303750000000001,
        "reward_max": -0.05118749999999987,
        "reward_min": -2.4388125,
        "leartime_s": 0.009711777995107695,
        "sampletime": 2.2090219620149583,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 188000,
        "reward_mean": -1.2799750000000003,
        "reward_max": -0.4176250000000001,
        "reward_min": -2.568437500000001,
        "leartime_s": 0.062037466996116564,
        "sampletime": 1.7846114770218264,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 190000,
        "reward_mean": -1.3333750000000004,
        "reward_max": -0.11962499999999993,
        "reward_min": -2.8016875000000003,
        "leartime_s": 0.035701365006389096,
        "sampletime": 2.1925720169965643,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 192000,
        "reward_mean": -1.1921750000000002,
        "reward_max": -0.15981250000000008,
        "reward_min": -2.3108125,
        "leartime_s": 0.010646957001881674,
        "sampletime": 1.9328287600073963,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 194000,
        "reward_mean": -1.2069750000000004,
        "reward_max": -0.12525000000000003,
        "reward_min": -2.3710625000000003,
        "leartime_s": 0.015621536003891379,
        "sampletime": 1.8842936299915891,
        "best_mean": -0.8138000000000002,
        "best_max": 0.1943125000000001,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 196000,
        "reward_mean": -0.8104750000000004,
        "reward_max": 0.29381250000000014,
        "reward_min": -1.8995000000000002,
        "leartime_s": 0.014479905978078023,
        "sampletime": 2.149283225997351,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 198000,
        "reward_mean": -1.0964250000000002,
        "reward_max": -0.15050000000000008,
        "reward_min": -2.2828125000000004,
        "leartime_s": 0.006705403997329995,
        "sampletime": 1.8502562350186054,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 200000,
        "reward_mean": -0.8169250000000003,
        "reward_max": 0.1361875000000002,
        "reward_min": -1.9840625000000012,
        "leartime_s": 0.03779897198546678,
        "sampletime": 1.8993489500135183,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 202000,
        "reward_mean": -0.8712250000000001,
        "reward_max": -0.1429374999999999,
        "reward_min": -1.8110625000000007,
        "leartime_s": 0.008570827019866556,
        "sampletime": 2.2015170010272413,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 204000,
        "reward_mean": -1.1544500000000002,
        "reward_max": 0.14206250000000012,
        "reward_min": -2.4158749999999998,
        "leartime_s": 0.02256930200383067,
        "sampletime": 2.1009606159932446,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 206000,
        "reward_mean": -1.3510250000000006,
        "reward_max": -0.5053750000000004,
        "reward_min": -2.8923125000000005,
        "leartime_s": 0.01840171602088958,
        "sampletime": 2.133974969998235,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 208000,
        "reward_mean": -1.0304,
        "reward_max": -0.13362499999999983,
        "reward_min": -2.774312500000001,
        "leartime_s": 0.017405189981218427,
        "sampletime": 1.7570200039772317,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 210000,
        "reward_mean": -1.1044750000000003,
        "reward_max": 0.08293749999999997,
        "reward_min": -2.380187500000001,
        "leartime_s": 0.026827243011211976,
        "sampletime": 1.8961387769959401,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 212000,
        "reward_mean": -1.1346500000000004,
        "reward_max": -0.05899999999999972,
        "reward_min": -2.4915625000000006,
        "leartime_s": 0.043012303998693824,
        "sampletime": 2.2434631409996655,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 214000,
        "reward_mean": -1.000725,
        "reward_max": 0.06587500000000032,
        "reward_min": -1.9940625000000005,
        "leartime_s": 0.011773471982451156,
        "sampletime": 1.9829272750066593,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 216000,
        "reward_mean": -1.110475,
        "reward_max": -0.04250000000000015,
        "reward_min": -2.5135625000000013,
        "leartime_s": 0.010167642001761124,
        "sampletime": 1.819141927990131,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 218000,
        "reward_mean": -1.0482750000000003,
        "reward_max": 0.010687499999999867,
        "reward_min": -2.5025000000000004,
        "leartime_s": 0.03396337298909202,
        "sampletime": 1.9429926430166233,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 220000,
        "reward_mean": -1.0439750000000003,
        "reward_max": -0.10300000000000004,
        "reward_min": -2.3901875,
        "leartime_s": 0.03606007801136002,
        "sampletime": 2.049752834980609,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 222000,
        "reward_mean": -1.4218000000000004,
        "reward_max": -0.5120625000000002,
        "reward_min": -2.8435000000000006,
        "leartime_s": 0.012060887995176017,
        "sampletime": 1.8564294100215193,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 224000,
        "reward_mean": -0.8819000000000002,
        "reward_max": -0.014312499999999971,
        "reward_min": -2.029000000000001,
        "leartime_s": 0.01158119400497526,
        "sampletime": 1.9978440779959783,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 226000,
        "reward_mean": -1.2872500000000004,
        "reward_max": -0.2229375000000003,
        "reward_min": -2.4496874999999996,
        "leartime_s": 0.009751867997692898,
        "sampletime": 1.990181218017824,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 228000,
        "reward_mean": -1.2031500000000002,
        "reward_max": -0.33781249999999996,
        "reward_min": -2.2671875,
        "leartime_s": 0.010828675993252546,
        "sampletime": 1.7925754149910063,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 230000,
        "reward_mean": -0.8168500000000002,
        "reward_max": 0.47400000000000014,
        "reward_min": -2.0798125000000005,
        "leartime_s": 0.028180196997709572,
        "sampletime": 1.8425727350113448,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 232000,
        "reward_mean": -1.0913500000000003,
        "reward_max": 0.06562500000000002,
        "reward_min": -2.1390000000000007,
        "leartime_s": 0.009157165011856705,
        "sampletime": 2.0263149599777535,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 234000,
        "reward_mean": -0.9455000000000002,
        "reward_max": -0.06212499999999983,
        "reward_min": -2.143687500000001,
        "leartime_s": 0.032123487995704636,
        "sampletime": 1.9613244209904224,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 236000,
        "reward_mean": -0.9719750000000003,
        "reward_max": 0.17962500000000003,
        "reward_min": -2.233312500000001,
        "leartime_s": 0.08524434099672362,
        "sampletime": 2.098581865982851,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 238000,
        "reward_mean": -1.0837750000000002,
        "reward_max": -0.24793749999999976,
        "reward_min": -2.3065000000000007,
        "leartime_s": 0.026298142009181902,
        "sampletime": 2.1546558730187826,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 240000,
        "reward_mean": -1.1064250000000002,
        "reward_max": -0.0099374999999998,
        "reward_min": -2.2583125,
        "leartime_s": 0.010681175976060331,
        "sampletime": 1.832613250007853,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 242000,
        "reward_mean": -0.8405000000000002,
        "reward_max": 0.044250000000000025,
        "reward_min": -1.937625000000001,
        "leartime_s": 0.015742444986244664,
        "sampletime": 1.7227208229887765,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 244000,
        "reward_mean": -0.8591000000000001,
        "reward_max": 0.12581250000000027,
        "reward_min": -2.2943124999999998,
        "leartime_s": 0.015407575003337115,
        "sampletime": 1.9535428019880783,
        "best_mean": -0.8104750000000004,
        "best_max": 0.29381250000000014,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 246000,
        "reward_mean": -0.8102000000000001,
        "reward_max": 0.19868750000000007,
        "reward_min": -2.0318125,
        "leartime_s": 0.012194937997264788,
        "sampletime": 1.689109782979358,
        "best_mean": -0.8102000000000001,
        "best_max": 0.19868750000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 248000,
        "reward_mean": -1.17185,
        "reward_max": -0.02399999999999991,
        "reward_min": -2.0750000000000006,
        "leartime_s": 0.01306158202351071,
        "sampletime": 2.1010085100133438,
        "best_mean": -0.8102000000000001,
        "best_max": 0.19868750000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 250000,
        "reward_mean": -0.73955,
        "reward_max": 0.3090000000000004,
        "reward_min": -1.7807500000000003,
        "leartime_s": 0.020402743015438318,
        "sampletime": 2.06672919401899,
        "best_mean": -0.73955,
        "best_max": 0.3090000000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 252000,
        "reward_mean": -0.800425,
        "reward_max": 0.04100000000000005,
        "reward_min": -2.036125000000001,
        "leartime_s": 0.01058883499354124,
        "sampletime": 1.7689161250018515,
        "best_mean": -0.73955,
        "best_max": 0.3090000000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 254000,
        "reward_mean": -0.8721250000000002,
        "reward_max": 0.061250000000000096,
        "reward_min": -1.9542500000000007,
        "leartime_s": 0.053763442003400996,
        "sampletime": 1.9252210709964857,
        "best_mean": -0.73955,
        "best_max": 0.3090000000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 256000,
        "reward_mean": -0.6644750000000001,
        "reward_max": 0.5277500000000004,
        "reward_min": -1.9462500000000005,
        "leartime_s": 0.05037768100737594,
        "sampletime": 2.0048803800018504,
        "best_mean": -0.6644750000000001,
        "best_max": 0.5277500000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 258000,
        "reward_mean": -0.5041749999999999,
        "reward_max": 0.5463125000000004,
        "reward_min": -1.5146250000000003,
        "leartime_s": 0.03224344601039775,
        "sampletime": 1.9595905230089556,
        "best_mean": -0.5041749999999999,
        "best_max": 0.5463125000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 260000,
        "reward_mean": -0.713075,
        "reward_max": 0.26400000000000007,
        "reward_min": -1.9798750000000005,
        "leartime_s": 0.019565555994631723,
        "sampletime": 1.7695286179950926,
        "best_mean": -0.5041749999999999,
        "best_max": 0.5463125000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 262000,
        "reward_mean": -0.3839749999999999,
        "reward_max": 0.5246250000000006,
        "reward_min": -1.5553749999999997,
        "leartime_s": 0.029401103005511686,
        "sampletime": 2.2561263789830264,
        "best_mean": -0.3839749999999999,
        "best_max": 0.5246250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 264000,
        "reward_mean": -0.6115999999999999,
        "reward_max": 0.3706250000000003,
        "reward_min": -1.8536875000000006,
        "leartime_s": 0.011342492012772709,
        "sampletime": 1.8522689170204103,
        "best_mean": -0.3839749999999999,
        "best_max": 0.5246250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 266000,
        "reward_mean": -0.5287000000000001,
        "reward_max": 0.4483750000000004,
        "reward_min": -1.4503125,
        "leartime_s": 0.023348093003733084,
        "sampletime": 1.8210275370220188,
        "best_mean": -0.3839749999999999,
        "best_max": 0.5246250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 268000,
        "reward_mean": -0.6423,
        "reward_max": 0.24350000000000022,
        "reward_min": -1.8774375,
        "leartime_s": 0.02474886699928902,
        "sampletime": 1.9863471810240299,
        "best_mean": -0.3839749999999999,
        "best_max": 0.5246250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 270000,
        "reward_mean": -0.2526999999999999,
        "reward_max": 0.5335000000000002,
        "reward_min": -1.3884375,
        "leartime_s": 0.01050554498215206,
        "sampletime": 1.9649517619982362,
        "best_mean": -0.2526999999999999,
        "best_max": 0.5335000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 272000,
        "reward_mean": -0.3282749999999999,
        "reward_max": 0.5637500000000005,
        "reward_min": -1.3763125,
        "leartime_s": 0.026926464022835717,
        "sampletime": 1.7329452109988779,
        "best_mean": -0.2526999999999999,
        "best_max": 0.5335000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 274000,
        "reward_mean": -0.4932249999999999,
        "reward_max": 0.8247500000000004,
        "reward_min": -1.5703125000000002,
        "leartime_s": 0.018142515007639304,
        "sampletime": 1.7005312500114087,
        "best_mean": -0.2526999999999999,
        "best_max": 0.5335000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 276000,
        "reward_mean": -0.40032499999999976,
        "reward_max": 0.45675000000000054,
        "reward_min": -1.7961250000000002,
        "leartime_s": 0.023141124984249473,
        "sampletime": 2.2246044559869915,
        "best_mean": -0.2526999999999999,
        "best_max": 0.5335000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 278000,
        "reward_mean": -0.28432499999999983,
        "reward_max": 0.36443750000000025,
        "reward_min": -1.2700625,
        "leartime_s": 0.029002862982451916,
        "sampletime": 1.8470296349842101,
        "best_mean": -0.2526999999999999,
        "best_max": 0.5335000000000002,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 280000,
        "reward_mean": -0.23589999999999975,
        "reward_max": 0.6082500000000005,
        "reward_min": -1.2983125000000002,
        "leartime_s": 0.03524818102596328,
        "sampletime": 1.949671643000329,
        "best_mean": -0.23589999999999975,
        "best_max": 0.6082500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 282000,
        "reward_mean": -0.37859999999999977,
        "reward_max": 0.5206250000000006,
        "reward_min": -1.6111249999999997,
        "leartime_s": 0.018064035015413538,
        "sampletime": 2.002520893001929,
        "best_mean": -0.23589999999999975,
        "best_max": 0.6082500000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 284000,
        "reward_mean": -0.1784749999999998,
        "reward_max": 0.6956250000000005,
        "reward_min": -1.2647500000000003,
        "leartime_s": 0.030399135983316228,
        "sampletime": 1.9252233660081401,
        "best_mean": -0.1784749999999998,
        "best_max": 0.6956250000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 286000,
        "reward_mean": -0.30937499999999984,
        "reward_max": 0.5115000000000001,
        "reward_min": -1.3584999999999998,
        "leartime_s": 0.06907125998986885,
        "sampletime": 1.876930091995746,
        "best_mean": -0.1784749999999998,
        "best_max": 0.6956250000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 288000,
        "reward_mean": -0.1453999999999997,
        "reward_max": 1.0360000000000007,
        "reward_min": -1.29925,
        "leartime_s": 0.011842912004794925,
        "sampletime": 2.27810359801515,
        "best_mean": -0.1453999999999997,
        "best_max": 1.0360000000000007,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 290000,
        "reward_mean": -0.12794999999999965,
        "reward_max": 0.9218750000000004,
        "reward_min": -1.1699374999999999,
        "leartime_s": 0.016954965016338974,
        "sampletime": 1.8044460820092354,
        "best_mean": -0.12794999999999965,
        "best_max": 0.9218750000000004,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 292000,
        "reward_mean": 0.0038000000000002958,
        "reward_max": 0.9092500000000003,
        "reward_min": -1.2456874999999998,
        "leartime_s": 0.04574832500657067,
        "sampletime": 1.972060047002742,
        "best_mean": 0.0038000000000002958,
        "best_max": 0.9092500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 294000,
        "reward_mean": -0.11674999999999973,
        "reward_max": 0.8040000000000003,
        "reward_min": -1.4361875000000004,
        "leartime_s": 0.0265095200156793,
        "sampletime": 2.2282588870148174,
        "best_mean": 0.0038000000000002958,
        "best_max": 0.9092500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 296000,
        "reward_mean": -0.2525499999999997,
        "reward_max": 0.6300625000000004,
        "reward_min": -1.3579999999999999,
        "leartime_s": 0.02431215299293399,
        "sampletime": 1.8013942639809102,
        "best_mean": 0.0038000000000002958,
        "best_max": 0.9092500000000003,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 298000,
        "reward_mean": 0.009425000000000324,
        "reward_max": 0.9176250000000006,
        "reward_min": -1.1121874999999997,
        "leartime_s": 0.011840683000627905,
        "sampletime": 1.8898631389893126,
        "best_mean": 0.009425000000000324,
        "best_max": 0.9176250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 300000,
        "reward_mean": -0.027174999999999633,
        "reward_max": 0.7988125000000006,
        "reward_min": -1.2333125,
        "leartime_s": 0.01700105599593371,
        "sampletime": 2.1098370480176527,
        "best_mean": 0.009425000000000324,
        "best_max": 0.9176250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 302000,
        "reward_mean": -0.21577499999999966,
        "reward_max": 0.7294375000000004,
        "reward_min": -1.1335624999999998,
        "leartime_s": 0.016236780997132882,
        "sampletime": 1.6938270640093833,
        "best_mean": 0.009425000000000324,
        "best_max": 0.9176250000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 304000,
        "reward_mean": 0.09340000000000032,
        "reward_max": 0.9403125000000006,
        "reward_min": -1.0006249999999997,
        "leartime_s": 0.02926327197928913,
        "sampletime": 2.1003640929993708,
        "best_mean": 0.09340000000000032,
        "best_max": 0.9403125000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 306000,
        "reward_mean": -0.04772499999999967,
        "reward_max": 0.7695000000000003,
        "reward_min": -0.98575,
        "leartime_s": 0.029327113006729633,
        "sampletime": 1.7449490209983196,
        "best_mean": 0.09340000000000032,
        "best_max": 0.9403125000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 308000,
        "reward_mean": 0.03460000000000038,
        "reward_max": 0.9688125000000007,
        "reward_min": -1.0988124999999997,
        "leartime_s": 0.0435523159976583,
        "sampletime": 1.855644791998202,
        "best_mean": 0.09340000000000032,
        "best_max": 0.9403125000000006,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 310000,
        "reward_mean": 0.13712500000000036,
        "reward_max": 1.2508125,
        "reward_min": -0.8160000000000001,
        "leartime_s": 0.029791735985781997,
        "sampletime": 1.837786766991485,
        "best_mean": 0.13712500000000036,
        "best_max": 1.2508125,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 312000,
        "reward_mean": 0.12425000000000042,
        "reward_max": 1.0901250000000007,
        "reward_min": -1.4424375,
        "leartime_s": 0.0328911819960922,
        "sampletime": 1.9326367010071408,
        "best_mean": 0.13712500000000036,
        "best_max": 1.2508125,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 314000,
        "reward_mean": 0.4569750000000004,
        "reward_max": 1.4353750000000005,
        "reward_min": -0.6363124999999995,
        "leartime_s": 0.034064733976265416,
        "sampletime": 2.2056834049872123,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 316000,
        "reward_mean": -0.005999999999999683,
        "reward_max": 0.8986250000000005,
        "reward_min": -1.2656249999999998,
        "leartime_s": 0.045853343995986506,
        "sampletime": 1.9883666039968375,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 318000,
        "reward_mean": 0.38290000000000035,
        "reward_max": 1.3540000000000005,
        "reward_min": -0.6571874999999996,
        "leartime_s": 0.03806344501208514,
        "sampletime": 2.0029776449955534,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 320000,
        "reward_mean": 0.10465000000000034,
        "reward_max": 1.1018750000000006,
        "reward_min": -0.93825,
        "leartime_s": 0.022540390986250713,
        "sampletime": 1.904933676996734,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 322000,
        "reward_mean": 0.10255000000000035,
        "reward_max": 1.0660000000000003,
        "reward_min": -1.0417500000000006,
        "leartime_s": 0.04166032301145606,
        "sampletime": 1.9262149639835116,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 324000,
        "reward_mean": 0.2533000000000004,
        "reward_max": 1.3822500000000006,
        "reward_min": -0.8252499999999998,
        "leartime_s": 0.05273958999896422,
        "sampletime": 1.9926497050037142,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 326000,
        "reward_mean": 0.07695000000000035,
        "reward_max": 0.8371250000000005,
        "reward_min": -1.156,
        "leartime_s": 0.035036568995565176,
        "sampletime": 2.2654353429970797,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 328000,
        "reward_mean": 0.07880000000000031,
        "reward_max": 1.0911250000000006,
        "reward_min": -1.054375,
        "leartime_s": 0.030378991999896243,
        "sampletime": 1.9350065250182524,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 330000,
        "reward_mean": -0.05832499999999966,
        "reward_max": 1.0476875000000008,
        "reward_min": -1.4206249999999998,
        "leartime_s": 0.0338239390111994,
        "sampletime": 2.244316722993972,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 332000,
        "reward_mean": -0.07099999999999969,
        "reward_max": 0.7101250000000003,
        "reward_min": -1.2521874999999993,
        "leartime_s": 0.05936052298056893,
        "sampletime": 1.7680689609842375,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 334000,
        "reward_mean": 0.12055000000000038,
        "reward_max": 1.2098750000000003,
        "reward_min": -1.1798749999999996,
        "leartime_s": 0.03134787900489755,
        "sampletime": 2.107206631975714,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 336000,
        "reward_mean": 0.17040000000000036,
        "reward_max": 1.1628750000000003,
        "reward_min": -0.8288124999999995,
        "leartime_s": 0.025567752978531644,
        "sampletime": 2.022447691997513,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 338000,
        "reward_mean": 0.13830000000000037,
        "reward_max": 1.080125000000001,
        "reward_min": -1.3094999999999997,
        "leartime_s": 0.04112144900136627,
        "sampletime": 1.8930822240072303,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 340000,
        "reward_mean": 0.03607500000000033,
        "reward_max": 1.2381875000000007,
        "reward_min": -1.1604999999999999,
        "leartime_s": 0.013603228988358751,
        "sampletime": 1.7113093869993463,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 342000,
        "reward_mean": 0.07972500000000034,
        "reward_max": 1.0301250000000004,
        "reward_min": -1.2433749999999997,
        "leartime_s": 0.019052751013077796,
        "sampletime": 1.932540045992937,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 344000,
        "reward_mean": 0.23650000000000038,
        "reward_max": 1.0238125000000005,
        "reward_min": -0.6599374999999996,
        "leartime_s": 0.05898131197318435,
        "sampletime": 1.7501104029943235,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 346000,
        "reward_mean": -0.005099999999999721,
        "reward_max": 1.0789375000000003,
        "reward_min": -1.3301249999999998,
        "leartime_s": 0.049782786023570225,
        "sampletime": 2.321985543007031,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 348000,
        "reward_mean": -0.3891499999999998,
        "reward_max": 0.9555625000000005,
        "reward_min": -1.6602500000000002,
        "leartime_s": 0.019853568985126913,
        "sampletime": 1.9296164670086,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 350000,
        "reward_mean": 0.08202500000000035,
        "reward_max": 0.8499375000000007,
        "reward_min": -1.297875,
        "leartime_s": 0.013851741998223588,
        "sampletime": 1.9584395470155869,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 352000,
        "reward_mean": -0.0658999999999997,
        "reward_max": 0.9478750000000005,
        "reward_min": -1.3661875,
        "leartime_s": 0.032367439998779446,
        "sampletime": 1.9772085959848482,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 354000,
        "reward_mean": 0.15005000000000035,
        "reward_max": 1.1418125000000006,
        "reward_min": -1.0601875,
        "leartime_s": 0.018842810997739434,
        "sampletime": 1.9495050729892682,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 356000,
        "reward_mean": 0.07335000000000035,
        "reward_max": 1.5227500000000007,
        "reward_min": -1.3275,
        "leartime_s": 0.05158095099614002,
        "sampletime": 1.9306778550089803,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 358000,
        "reward_mean": 0.08432500000000037,
        "reward_max": 1.1800000000000006,
        "reward_min": -1.2425625000000002,
        "leartime_s": 0.015722826006822288,
        "sampletime": 2.0249073730083182,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 360000,
        "reward_mean": -0.21104999999999974,
        "reward_max": 1.0137500000000008,
        "reward_min": -1.3960000000000004,
        "leartime_s": 0.021934804011834785,
        "sampletime": 1.9005746449984144,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 362000,
        "reward_mean": -0.20282499999999976,
        "reward_max": 0.6864375000000005,
        "reward_min": -1.2682499999999999,
        "leartime_s": 0.10416834999341518,
        "sampletime": 1.9764134950237349,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 364000,
        "reward_mean": 0.03357500000000027,
        "reward_max": 0.9846250000000004,
        "reward_min": -1.0515,
        "leartime_s": 0.02935859397985041,
        "sampletime": 2.0068804070178885,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 366000,
        "reward_mean": -0.20272499999999974,
        "reward_max": 0.5207500000000004,
        "reward_min": -1.6411875000000005,
        "leartime_s": 0.06698155097546987,
        "sampletime": 2.046137329976773,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 368000,
        "reward_mean": 0.026400000000000277,
        "reward_max": 1.0196250000000004,
        "reward_min": -1.2382499999999999,
        "leartime_s": 0.014674865989945829,
        "sampletime": 2.0478314200008754,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 370000,
        "reward_mean": -0.15572499999999978,
        "reward_max": 0.7512500000000005,
        "reward_min": -1.8327499999999999,
        "leartime_s": 0.03512400001636706,
        "sampletime": 2.0128879719995894,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 372000,
        "reward_mean": -0.20357499999999976,
        "reward_max": 0.7642500000000004,
        "reward_min": -1.7511875000000001,
        "leartime_s": 0.03733917701174505,
        "sampletime": 1.9538147229759488,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 374000,
        "reward_mean": -0.17727499999999974,
        "reward_max": 0.8096250000000004,
        "reward_min": -1.5394999999999999,
        "leartime_s": 0.02787817199714482,
        "sampletime": 1.5645452650205698,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 376000,
        "reward_mean": -0.25072499999999975,
        "reward_max": 0.5610625000000005,
        "reward_min": -1.2571874999999997,
        "leartime_s": 0.0292215820227284,
        "sampletime": 1.7176364730112255,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 378000,
        "reward_mean": -0.2942999999999998,
        "reward_max": 0.7703750000000005,
        "reward_min": -1.35125,
        "leartime_s": 0.07321852300083265,
        "sampletime": 2.037897278001765,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 380000,
        "reward_mean": -0.19867499999999977,
        "reward_max": 0.7438750000000005,
        "reward_min": -1.5084999999999997,
        "leartime_s": 0.013819448999129236,
        "sampletime": 2.0362958849873394,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 382000,
        "reward_mean": -0.2752749999999999,
        "reward_max": 0.8330625000000003,
        "reward_min": -1.711875,
        "leartime_s": 0.016940915025770664,
        "sampletime": 1.9326892599929124,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 384000,
        "reward_mean": -0.15919999999999987,
        "reward_max": 0.9343125000000002,
        "reward_min": -0.9873125000000001,
        "leartime_s": 0.05564655200578272,
        "sampletime": 2.0267038470192347,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 386000,
        "reward_mean": -0.3184499999999998,
        "reward_max": 0.6878125000000004,
        "reward_min": -1.5161250000000002,
        "leartime_s": 0.03531759898760356,
        "sampletime": 2.3365845480002463,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 388000,
        "reward_mean": -0.08877499999999967,
        "reward_max": 1.1006875000000003,
        "reward_min": -1.2000624999999998,
        "leartime_s": 0.024668515019584447,
        "sampletime": 1.6885485170059837,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 390000,
        "reward_mean": 0.0467750000000003,
        "reward_max": 0.8840000000000005,
        "reward_min": -0.9285000000000001,
        "leartime_s": 0.01506564998999238,
        "sampletime": 2.278850845003035,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 392000,
        "reward_mean": -0.18414999999999979,
        "reward_max": 0.6810625000000005,
        "reward_min": -1.2105000000000001,
        "leartime_s": 0.014638348016887903,
        "sampletime": 1.881576790008694,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 394000,
        "reward_mean": -0.38044999999999984,
        "reward_max": 0.44550000000000023,
        "reward_min": -1.5147500000000003,
        "leartime_s": 0.018886318983277306,
        "sampletime": 1.7552660049987026,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 396000,
        "reward_mean": -0.2707499999999998,
        "reward_max": 0.6527500000000006,
        "reward_min": -1.4314375000000001,
        "leartime_s": 0.0588251170120202,
        "sampletime": 2.1571040260023437,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 398000,
        "reward_mean": -0.21517499999999973,
        "reward_max": 0.7335000000000003,
        "reward_min": -1.31825,
        "leartime_s": 0.03067089300020598,
        "sampletime": 1.9116185049933847,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 400000,
        "reward_mean": -0.4029749999999998,
        "reward_max": 0.6990000000000005,
        "reward_min": -1.7234375000000004,
        "leartime_s": 0.028583990002516657,
        "sampletime": 1.8007746709918138,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 402000,
        "reward_mean": -0.3252999999999998,
        "reward_max": 0.7405625000000006,
        "reward_min": -1.5136249999999998,
        "leartime_s": 0.014425747009227052,
        "sampletime": 1.9153273529955186,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 404000,
        "reward_mean": -0.18204999999999985,
        "reward_max": 0.8741875000000006,
        "reward_min": -1.2371875,
        "leartime_s": 0.028134413994848728,
        "sampletime": 2.189043185004266,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 406000,
        "reward_mean": -0.0869249999999997,
        "reward_max": 0.8779375000000005,
        "reward_min": -1.3584999999999998,
        "leartime_s": 0.030698682996444404,
        "sampletime": 1.7112848929828033,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 408000,
        "reward_mean": -0.13557499999999975,
        "reward_max": 1.1302500000000006,
        "reward_min": -1.4653125000000002,
        "leartime_s": 0.026047664985526353,
        "sampletime": 1.6209998049889691,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 410000,
        "reward_mean": -0.26054999999999984,
        "reward_max": 0.7568750000000003,
        "reward_min": -1.4408750000000001,
        "leartime_s": 0.01935812400188297,
        "sampletime": 2.149262105987873,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 412000,
        "reward_mean": -0.19102499999999983,
        "reward_max": 0.7171875000000002,
        "reward_min": -1.3287500000000003,
        "leartime_s": 0.03859382899827324,
        "sampletime": 1.7331445819872897,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 414000,
        "reward_mean": -0.46954999999999986,
        "reward_max": 0.5475625000000003,
        "reward_min": -1.7495,
        "leartime_s": 0.012336298008449376,
        "sampletime": 2.1571097770065535,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 416000,
        "reward_mean": -0.25424999999999975,
        "reward_max": 0.4457500000000004,
        "reward_min": -1.3860000000000003,
        "leartime_s": 0.03653423901414499,
        "sampletime": 2.0335894979943987,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 418000,
        "reward_mean": -0.19537499999999977,
        "reward_max": 0.9663125000000006,
        "reward_min": -1.209875,
        "leartime_s": 0.022005505015840754,
        "sampletime": 1.88373123499332,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 420000,
        "reward_mean": -0.39274999999999977,
        "reward_max": 0.6069375000000007,
        "reward_min": -1.6801875000000004,
        "leartime_s": 0.031918473017867655,
        "sampletime": 2.2664432259916794,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 422000,
        "reward_mean": -0.29204999999999987,
        "reward_max": 0.8078750000000002,
        "reward_min": -1.5976250000000007,
        "leartime_s": 0.023160523996921256,
        "sampletime": 1.769118804979371,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 424000,
        "reward_mean": -0.18624999999999972,
        "reward_max": 0.8481250000000006,
        "reward_min": -1.3291875000000004,
        "leartime_s": 0.02936695300741121,
        "sampletime": 2.0669860880007036,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 426000,
        "reward_mean": -0.33392499999999986,
        "reward_max": 0.5874375000000006,
        "reward_min": -1.4303124999999999,
        "leartime_s": 0.06898275500861928,
        "sampletime": 1.9227844130073208,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 428000,
        "reward_mean": -0.22864999999999971,
        "reward_max": 0.8717500000000007,
        "reward_min": -1.2659999999999998,
        "leartime_s": 0.023827839002478868,
        "sampletime": 1.8760754310060292,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 430000,
        "reward_mean": -0.1856749999999998,
        "reward_max": 0.7261250000000004,
        "reward_min": -1.2623124999999997,
        "leartime_s": 0.015058371995110065,
        "sampletime": 2.0704962620220613,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 432000,
        "reward_mean": -0.37524999999999975,
        "reward_max": 0.5304375000000005,
        "reward_min": -1.3693750000000005,
        "leartime_s": 0.021618211001623422,
        "sampletime": 1.9568100619944744,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 434000,
        "reward_mean": -0.36394999999999983,
        "reward_max": 0.7721250000000003,
        "reward_min": -1.442875,
        "leartime_s": 0.042546646000118926,
        "sampletime": 1.9363593189918902,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 436000,
        "reward_mean": -0.2117999999999998,
        "reward_max": 0.6743125000000005,
        "reward_min": -1.2638124999999998,
        "leartime_s": 0.025540963019011542,
        "sampletime": 1.9849638210143894,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 438000,
        "reward_mean": -0.1371749999999998,
        "reward_max": 0.9850625000000004,
        "reward_min": -1.2064375000000003,
        "leartime_s": 0.033842517994344234,
        "sampletime": 1.9766104869777337,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 440000,
        "reward_mean": -0.3119999999999998,
        "reward_max": 0.5506250000000005,
        "reward_min": -1.4422500000000003,
        "leartime_s": 0.014996315992902964,
        "sampletime": 1.605530031985836,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 442000,
        "reward_mean": -0.2988499999999997,
        "reward_max": 0.6783750000000006,
        "reward_min": -1.4064999999999996,
        "leartime_s": 0.041162987996358424,
        "sampletime": 1.757371224986855,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 444000,
        "reward_mean": -0.3070499999999997,
        "reward_max": 0.6005625000000006,
        "reward_min": -1.556875,
        "leartime_s": 0.0643488299974706,
        "sampletime": 1.9753397419990506,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 446000,
        "reward_mean": -0.44627499999999987,
        "reward_max": 0.5860625000000003,
        "reward_min": -1.6955000000000005,
        "leartime_s": 0.05675839999457821,
        "sampletime": 2.2310383020085283,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 448000,
        "reward_mean": -0.35927499999999984,
        "reward_max": 0.8101875000000005,
        "reward_min": -1.8047500000000003,
        "leartime_s": 0.029714795004110783,
        "sampletime": 1.9529216749942861,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 450000,
        "reward_mean": -0.5246999999999997,
        "reward_max": 0.6103750000000003,
        "reward_min": -1.82925,
        "leartime_s": 0.042659286002162844,
        "sampletime": 1.918598362011835,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 452000,
        "reward_mean": -0.5760250000000001,
        "reward_max": 0.4966875000000004,
        "reward_min": -1.5995000000000004,
        "leartime_s": 0.014320561022032052,
        "sampletime": 2.1238669409940485,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 454000,
        "reward_mean": -0.47952499999999987,
        "reward_max": 0.5674375000000005,
        "reward_min": -1.5835625000000002,
        "leartime_s": 0.04327192099299282,
        "sampletime": 1.946600944007514,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 456000,
        "reward_mean": -0.6260749999999998,
        "reward_max": 0.5540000000000004,
        "reward_min": -1.8306874999999998,
        "leartime_s": 0.03058984299423173,
        "sampletime": 1.72586787599721,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 458000,
        "reward_mean": -0.3131499999999999,
        "reward_max": 0.6415625000000004,
        "reward_min": -1.6003749999999997,
        "leartime_s": 0.02102428799844347,
        "sampletime": 2.2404372010205407,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 460000,
        "reward_mean": -0.7223499999999999,
        "reward_max": 0.22481250000000025,
        "reward_min": -1.8639375000000007,
        "leartime_s": 0.035649472003569826,
        "sampletime": 1.9826304040034302,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 462000,
        "reward_mean": -0.5186,
        "reward_max": 0.3349375000000002,
        "reward_min": -1.89775,
        "leartime_s": 0.02631099900463596,
        "sampletime": 2.096275253017666,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 464000,
        "reward_mean": -0.5842499999999999,
        "reward_max": 0.5186875000000005,
        "reward_min": -1.873,
        "leartime_s": 0.0391025319986511,
        "sampletime": 1.8757106259872671,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 466000,
        "reward_mean": -0.6503749999999999,
        "reward_max": 0.4350625000000004,
        "reward_min": -2.3143125,
        "leartime_s": 0.04018974700011313,
        "sampletime": 2.150789684994379,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 468000,
        "reward_mean": -0.44132499999999986,
        "reward_max": 0.4347500000000005,
        "reward_min": -1.448,
        "leartime_s": 0.06855739399907179,
        "sampletime": 2.01902950098156,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 470000,
        "reward_mean": -0.6185499999999999,
        "reward_max": 0.3770625000000004,
        "reward_min": -2.1567500000000006,
        "leartime_s": 0.07517612399533391,
        "sampletime": 1.7805694809940178,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 472000,
        "reward_mean": -0.55125,
        "reward_max": 0.6084375000000004,
        "reward_min": -1.6118125,
        "leartime_s": 0.01922434300649911,
        "sampletime": 1.9518463929998688,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 474000,
        "reward_mean": -0.5602999999999999,
        "reward_max": 0.5511250000000005,
        "reward_min": -2.065000000000001,
        "leartime_s": 0.012871323997387663,
        "sampletime": 1.638737511006184,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 476000,
        "reward_mean": -0.48224999999999996,
        "reward_max": 0.35562500000000014,
        "reward_min": -1.9130625000000008,
        "leartime_s": 0.013258146995212883,
        "sampletime": 1.6941187499905936,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 478000,
        "reward_mean": -0.567225,
        "reward_max": 0.4721250000000005,
        "reward_min": -1.4387500000000002,
        "leartime_s": 0.03732224498526193,
        "sampletime": 1.88700649299426,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 480000,
        "reward_mean": -0.771,
        "reward_max": 0.3484375000000004,
        "reward_min": -2.537625,
        "leartime_s": 0.04567180000594817,
        "sampletime": 2.129419839999173,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 482000,
        "reward_mean": -0.69405,
        "reward_max": 0.18512500000000026,
        "reward_min": -1.7373125,
        "leartime_s": 0.013973372988402843,
        "sampletime": 1.9571581030031666,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 484000,
        "reward_mean": -0.6427999999999999,
        "reward_max": 0.4411250000000002,
        "reward_min": -1.8013750000000002,
        "leartime_s": 0.01531431099283509,
        "sampletime": 2.029315655992832,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 486000,
        "reward_mean": -0.6670750000000001,
        "reward_max": 0.3033750000000004,
        "reward_min": -1.8513125000000006,
        "leartime_s": 0.018719391024205834,
        "sampletime": 1.8982883349817712,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 488000,
        "reward_mean": -0.6438000000000001,
        "reward_max": 0.4501250000000003,
        "reward_min": -1.9620000000000002,
        "leartime_s": 0.03682638201280497,
        "sampletime": 2.239336768980138,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 490000,
        "reward_mean": -0.73805,
        "reward_max": 0.38300000000000056,
        "reward_min": -1.8626250000000006,
        "leartime_s": 0.03204524400644004,
        "sampletime": 1.8533626979915425,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 492000,
        "reward_mean": -0.7997000000000001,
        "reward_max": 0.21012500000000017,
        "reward_min": -1.7946875000000007,
        "leartime_s": 0.047996990993851796,
        "sampletime": 2.409777908003889,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 494000,
        "reward_mean": -0.7581500000000001,
        "reward_max": 0.20081250000000023,
        "reward_min": -1.8565625000000008,
        "leartime_s": 0.019690754008479416,
        "sampletime": 1.9694773190130945,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 496000,
        "reward_mean": -0.8597250000000001,
        "reward_max": 0.1166875000000004,
        "reward_min": -2.1286875000000007,
        "leartime_s": 0.03184108200366609,
        "sampletime": 1.6835694609908387,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 498000,
        "reward_mean": -0.8150500000000002,
        "reward_max": 0.010875000000000051,
        "reward_min": -1.7613750000000001,
        "leartime_s": 0.03444245402351953,
        "sampletime": 1.797953077009879,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 500000,
        "reward_mean": -0.8805250000000003,
        "reward_max": -0.0964374999999999,
        "reward_min": -2.0356875000000008,
        "leartime_s": 0.038982629019301385,
        "sampletime": 1.8701882289897185,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 502000,
        "reward_mean": -0.8583500000000002,
        "reward_max": 0.07012500000000019,
        "reward_min": -1.8464375,
        "leartime_s": 0.040438178984913975,
        "sampletime": 1.975574305979535,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 504000,
        "reward_mean": -1.055875,
        "reward_max": 0.04518750000000013,
        "reward_min": -2.703187500000001,
        "leartime_s": 0.02232560599804856,
        "sampletime": 1.900450135988649,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 506000,
        "reward_mean": -0.9182500000000002,
        "reward_max": 0.09087500000000004,
        "reward_min": -1.8482500000000006,
        "leartime_s": 0.043549436988541856,
        "sampletime": 1.7752572130120825,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 508000,
        "reward_mean": -0.9338750000000002,
        "reward_max": 0.09625000000000014,
        "reward_min": -2.1276875000000004,
        "leartime_s": 0.03480527497595176,
        "sampletime": 2.2256748939980753,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 510000,
        "reward_mean": -0.7593000000000002,
        "reward_max": 0.32400000000000057,
        "reward_min": -2.3533750000000015,
        "leartime_s": 0.04083551300573163,
        "sampletime": 1.8391395020007621,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 512000,
        "reward_mean": -0.8980750000000003,
        "reward_max": 0.10025000000000026,
        "reward_min": -2.0533750000000004,
        "leartime_s": 0.06092946100397967,
        "sampletime": 1.9056555159913842,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 514000,
        "reward_mean": -0.8678750000000002,
        "reward_max": 0.1576250000000003,
        "reward_min": -2.1615000000000006,
        "leartime_s": 0.04313643099158071,
        "sampletime": 1.9174825410009362,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 516000,
        "reward_mean": -0.8354500000000001,
        "reward_max": 0.049999999999999975,
        "reward_min": -2.007250000000001,
        "leartime_s": 0.028069061983842403,
        "sampletime": 2.017877831996884,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 518000,
        "reward_mean": -0.6395500000000002,
        "reward_max": 0.29812500000000025,
        "reward_min": -1.812625,
        "leartime_s": 0.018969241995364428,
        "sampletime": 1.7392135840200353,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 520000,
        "reward_mean": -0.6949750000000001,
        "reward_max": 0.32487499999999997,
        "reward_min": -2.1563125000000007,
        "leartime_s": 0.035211050999350846,
        "sampletime": 2.277248605998466,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 522000,
        "reward_mean": -0.8788750000000002,
        "reward_max": 0.12275,
        "reward_min": -2.109875000000001,
        "leartime_s": 0.025491681997664273,
        "sampletime": 1.8349614010076039,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 524000,
        "reward_mean": -0.7970000000000002,
        "reward_max": 0.28787500000000044,
        "reward_min": -2.081000000000001,
        "leartime_s": 0.07788156799506396,
        "sampletime": 1.984942098002648,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 526000,
        "reward_mean": -0.9515250000000003,
        "reward_max": -0.03274999999999994,
        "reward_min": -2.035375000000001,
        "leartime_s": 0.01592298797913827,
        "sampletime": 2.1541641000076197,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 528000,
        "reward_mean": -0.7167250000000002,
        "reward_max": 0.20312500000000028,
        "reward_min": -2.7460000000000004,
        "leartime_s": 0.05790583899943158,
        "sampletime": 1.9029083590139635,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 530000,
        "reward_mean": -0.9065750000000002,
        "reward_max": 0.018312500000000034,
        "reward_min": -1.9216250000000006,
        "leartime_s": 0.050779020006302744,
        "sampletime": 2.177171809016727,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 532000,
        "reward_mean": -0.9708250000000002,
        "reward_max": -0.01237499999999983,
        "reward_min": -2.0367500000000014,
        "leartime_s": 0.02340884698787704,
        "sampletime": 1.7439524490037002,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 534000,
        "reward_mean": -0.8631250000000003,
        "reward_max": 0.13518750000000024,
        "reward_min": -2.002937500000001,
        "leartime_s": 0.04791050899075344,
        "sampletime": 1.8636885070009157,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 536000,
        "reward_mean": -1.0659,
        "reward_max": -0.16712499999999986,
        "reward_min": -2.1985625000000004,
        "leartime_s": 0.02150948200142011,
        "sampletime": 2.0905690109939314,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 538000,
        "reward_mean": -1.0935500000000005,
        "reward_max": -0.2012499999999999,
        "reward_min": -1.9637500000000008,
        "leartime_s": 0.052843687997665256,
        "sampletime": 1.6265664160018787,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 540000,
        "reward_mean": -0.9379750000000002,
        "reward_max": 0.027624999999999934,
        "reward_min": -2.1951875000000003,
        "leartime_s": 0.017984643985982984,
        "sampletime": 1.7641201569931582,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 542000,
        "reward_mean": -1.1447750000000003,
        "reward_max": -0.18956250000000002,
        "reward_min": -2.1308125000000007,
        "leartime_s": 0.03872434498043731,
        "sampletime": 2.0463714019861072,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 544000,
        "reward_mean": -0.73255,
        "reward_max": 0.2955625000000001,
        "reward_min": -2.1160625,
        "leartime_s": 0.026286437991075218,
        "sampletime": 1.95031205000123,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 546000,
        "reward_mean": -0.7238000000000002,
        "reward_max": 0.19843750000000004,
        "reward_min": -1.7392500000000004,
        "leartime_s": 0.030713993997778744,
        "sampletime": 1.7408379380067345,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 548000,
        "reward_mean": -0.8940250000000002,
        "reward_max": 0.0148125000000002,
        "reward_min": -2.028375,
        "leartime_s": 0.02969591598957777,
        "sampletime": 2.195544909016462,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 550000,
        "reward_mean": -0.7326500000000001,
        "reward_max": 0.4773750000000002,
        "reward_min": -2.0539375,
        "leartime_s": 0.05767568701412529,
        "sampletime": 2.03667182000936,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 552000,
        "reward_mean": -1.0612250000000003,
        "reward_max": 0.07006250000000006,
        "reward_min": -2.245375,
        "leartime_s": 0.06760693498654291,
        "sampletime": 1.7763441510032862,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 554000,
        "reward_mean": -0.7958750000000001,
        "reward_max": 0.19668750000000018,
        "reward_min": -2.069125,
        "leartime_s": 0.016089786018710583,
        "sampletime": 2.024951087019872,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 556000,
        "reward_mean": -1.0143750000000002,
        "reward_max": -0.05218749999999996,
        "reward_min": -2.1979375000000005,
        "leartime_s": 0.03155999002046883,
        "sampletime": 1.9775876599887852,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 558000,
        "reward_mean": -0.84245,
        "reward_max": -0.01643749999999955,
        "reward_min": -2.0777500000000004,
        "leartime_s": 0.05328966400702484,
        "sampletime": 1.7290135539951734,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 560000,
        "reward_mean": -0.9653250000000003,
        "reward_max": 0.2899375000000001,
        "reward_min": -2.4788750000000004,
        "leartime_s": 0.011819272011052817,
        "sampletime": 2.0406010890146717,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 562000,
        "reward_mean": -0.8729750000000002,
        "reward_max": 0.09150000000000016,
        "reward_min": -2.0617500000000004,
        "leartime_s": 0.028293164999922737,
        "sampletime": 1.9056809300091118,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 564000,
        "reward_mean": -0.8490750000000001,
        "reward_max": 0.056812500000000224,
        "reward_min": -2.1365000000000003,
        "leartime_s": 0.04013368801679462,
        "sampletime": 1.7024159230059013,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 566000,
        "reward_mean": -0.8266500000000001,
        "reward_max": 0.16525000000000029,
        "reward_min": -1.952375000000001,
        "leartime_s": 0.02835397099261172,
        "sampletime": 2.400972138013458,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 568000,
        "reward_mean": -0.6343,
        "reward_max": 0.2787500000000001,
        "reward_min": -1.8146250000000004,
        "leartime_s": 0.045259221020387486,
        "sampletime": 1.8152022400172427,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 570000,
        "reward_mean": -0.9763750000000002,
        "reward_max": 0.07381250000000014,
        "reward_min": -2.470437500000001,
        "leartime_s": 0.048198453994700685,
        "sampletime": 1.8259151469974313,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 572000,
        "reward_mean": -1.0859500000000002,
        "reward_max": -0.1275624999999998,
        "reward_min": -2.4546250000000005,
        "leartime_s": 0.061650987016037107,
        "sampletime": 1.671467414998915,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 574000,
        "reward_mean": -0.9117000000000003,
        "reward_max": 0.08425000000000027,
        "reward_min": -2.2715000000000005,
        "leartime_s": 0.06428070898982696,
        "sampletime": 1.8798930119955912,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 576000,
        "reward_mean": -0.9667750000000003,
        "reward_max": -0.09099999999999983,
        "reward_min": -1.9487500000000009,
        "leartime_s": 0.039551321999169886,
        "sampletime": 1.962138614995638,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 578000,
        "reward_mean": -1.2017000000000004,
        "reward_max": -0.23337500000000003,
        "reward_min": -2.5696250000000007,
        "leartime_s": 0.07645572401816025,
        "sampletime": 2.2444533760135528,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 580000,
        "reward_mean": -1.0231750000000002,
        "reward_max": -0.17174999999999993,
        "reward_min": -2.551437500000001,
        "leartime_s": 0.0359928930120077,
        "sampletime": 1.9790534669882618,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 582000,
        "reward_mean": -0.9288750000000002,
        "reward_max": 0.31062500000000026,
        "reward_min": -1.9908749999999997,
        "leartime_s": 0.019861598004354164,
        "sampletime": 1.6776085699966643,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 584000,
        "reward_mean": -1.0365,
        "reward_max": -0.018749999999999926,
        "reward_min": -2.3629375000000006,
        "leartime_s": 0.03999904700322077,
        "sampletime": 2.019912165007554,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 586000,
        "reward_mean": -0.75495,
        "reward_max": 0.2128125000000002,
        "reward_min": -1.7073750000000005,
        "leartime_s": 0.05108544699032791,
        "sampletime": 2.0808320379874203,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 588000,
        "reward_mean": -0.9123500000000001,
        "reward_max": 0.07243750000000036,
        "reward_min": -2.3563125,
        "leartime_s": 0.047801686014281586,
        "sampletime": 2.0482848529936746,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 590000,
        "reward_mean": -0.9936250000000001,
        "reward_max": -0.07412499999999965,
        "reward_min": -2.3958750000000006,
        "leartime_s": 0.09484476898796856,
        "sampletime": 1.9350659160118084,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 592000,
        "reward_mean": -1.0796750000000002,
        "reward_max": -0.10324999999999973,
        "reward_min": -2.2558124999999998,
        "leartime_s": 0.029705786000704393,
        "sampletime": 2.0734371060098056,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 594000,
        "reward_mean": -0.8937000000000002,
        "reward_max": -0.0441874999999997,
        "reward_min": -2.015000000000001,
        "leartime_s": 0.05488387600053102,
        "sampletime": 1.8432656680233777,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 596000,
        "reward_mean": -0.8265250000000001,
        "reward_max": 0.32325000000000026,
        "reward_min": -2.120375,
        "leartime_s": 0.018696454993914813,
        "sampletime": 1.812252822011942,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 598000,
        "reward_mean": -1.1809500000000002,
        "reward_max": -0.1636875000000001,
        "reward_min": -2.3418750000000004,
        "leartime_s": 0.01905610298854299,
        "sampletime": 2.086498558986932,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 600000,
        "reward_mean": -1.1670500000000001,
        "reward_max": -0.2896249999999998,
        "reward_min": -2.4692500000000006,
        "leartime_s": 0.030764633003855124,
        "sampletime": 1.956344941019779,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 602000,
        "reward_mean": -1.0790500000000003,
        "reward_max": -0.1436874999999997,
        "reward_min": -2.5806875000000007,
        "leartime_s": 0.04811878898181021,
        "sampletime": 1.788927175977733,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 604000,
        "reward_mean": -1.048175,
        "reward_max": -0.07718749999999984,
        "reward_min": -2.1841250000000003,
        "leartime_s": 0.05543804101762362,
        "sampletime": 1.6596430019999389,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 606000,
        "reward_mean": -1.0987250000000002,
        "reward_max": -0.05724999999999976,
        "reward_min": -2.4795000000000003,
        "leartime_s": 0.02977500599808991,
        "sampletime": 2.377807101001963,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 608000,
        "reward_mean": -1.03665,
        "reward_max": 0.11487500000000034,
        "reward_min": -2.639875,
        "leartime_s": 0.026071284984936938,
        "sampletime": 1.8253214310097974,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 610000,
        "reward_mean": -1.0804500000000004,
        "reward_max": -0.16587499999999983,
        "reward_min": -2.2633750000000004,
        "leartime_s": 0.044739883014699444,
        "sampletime": 2.110189986997284,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 612000,
        "reward_mean": -0.9183250000000002,
        "reward_max": 0.17612499999999998,
        "reward_min": -2.3882500000000007,
        "leartime_s": 0.051134982000803575,
        "sampletime": 1.9052188450004905,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 614000,
        "reward_mean": -1.1565500000000002,
        "reward_max": -0.17843749999999992,
        "reward_min": -2.8382499999999995,
        "leartime_s": 0.029239598021376878,
        "sampletime": 1.7718933380092494,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 616000,
        "reward_mean": -1.2089500000000002,
        "reward_max": -0.1284999999999998,
        "reward_min": -2.5115,
        "leartime_s": 0.03776692898827605,
        "sampletime": 1.8551537259772886,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 618000,
        "reward_mean": -0.9064000000000001,
        "reward_max": 0.1543125000000004,
        "reward_min": -2.3593750000000004,
        "leartime_s": 0.0500935569871217,
        "sampletime": 2.199148804997094,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 620000,
        "reward_mean": -0.9924000000000003,
        "reward_max": -0.04437499999999993,
        "reward_min": -2.0930000000000004,
        "leartime_s": 0.024568680993979797,
        "sampletime": 1.7030566049797926,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 622000,
        "reward_mean": -1.073625,
        "reward_max": -0.05381250000000001,
        "reward_min": -2.1866250000000003,
        "leartime_s": 0.032382685982156545,
        "sampletime": 2.0982359450135846,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 624000,
        "reward_mean": -0.9484500000000001,
        "reward_max": 0.1793750000000003,
        "reward_min": -1.8925625000000006,
        "leartime_s": 0.03490248598973267,
        "sampletime": 1.9688491830020212,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 626000,
        "reward_mean": -0.9850500000000002,
        "reward_max": -0.003499999999999809,
        "reward_min": -2.162,
        "leartime_s": 0.058570271998178214,
        "sampletime": 1.9369266710127704,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 628000,
        "reward_mean": -1.0069249999999998,
        "reward_max": 0.18937500000000043,
        "reward_min": -2.3086875000000004,
        "leartime_s": 0.01966506298049353,
        "sampletime": 1.8384916520153638,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 630000,
        "reward_mean": -1.0202250000000002,
        "reward_max": -0.24356249999999982,
        "reward_min": -2.2268750000000006,
        "leartime_s": 0.033834297995781526,
        "sampletime": 1.9136260249943007,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 632000,
        "reward_mean": -1.1761750000000002,
        "reward_max": 0.10687500000000005,
        "reward_min": -2.6152500000000014,
        "leartime_s": 0.05971007002517581,
        "sampletime": 2.1613546200096607,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 634000,
        "reward_mean": -1.0947500000000006,
        "reward_max": -0.12668749999999987,
        "reward_min": -2.3051250000000008,
        "leartime_s": 0.05776628901367076,
        "sampletime": 1.9795848529902287,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 636000,
        "reward_mean": -1.0995,
        "reward_max": -0.05231249999999978,
        "reward_min": -2.2615625000000006,
        "leartime_s": 0.02599926700349897,
        "sampletime": 1.766527308995137,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 638000,
        "reward_mean": -0.723975,
        "reward_max": 0.06043750000000017,
        "reward_min": -2.1961250000000003,
        "leartime_s": 0.03414363000774756,
        "sampletime": 1.682176932983566,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 640000,
        "reward_mean": -0.9817500000000001,
        "reward_max": 0.00912500000000023,
        "reward_min": -2.775375000000001,
        "leartime_s": 0.02245745898107998,
        "sampletime": 1.8760441140038893,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 642000,
        "reward_mean": -1.1328000000000003,
        "reward_max": 0.005187500000000171,
        "reward_min": -2.3033750000000004,
        "leartime_s": 0.04083039300167002,
        "sampletime": 1.8908147210022435,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 644000,
        "reward_mean": -0.8709750000000002,
        "reward_max": -0.038499999999999854,
        "reward_min": -2.3933125,
        "leartime_s": 0.0587712140113581,
        "sampletime": 1.900655787991127,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 646000,
        "reward_mean": -1.0182750000000003,
        "reward_max": -0.21843750000000003,
        "reward_min": -2.3854375,
        "leartime_s": 0.04112981501384638,
        "sampletime": 2.085511848999886,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 648000,
        "reward_mean": -0.9401250000000002,
        "reward_max": 0.0768125000000002,
        "reward_min": -2.1450625000000008,
        "leartime_s": 0.051271144999191165,
        "sampletime": 1.8187006380176172,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 650000,
        "reward_mean": -0.9203000000000002,
        "reward_max": -0.09337499999999996,
        "reward_min": -2.150000000000001,
        "leartime_s": 0.10249314000247978,
        "sampletime": 1.8913229040044826,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 652000,
        "reward_mean": -1.2255,
        "reward_max": -0.25081249999999994,
        "reward_min": -2.482000000000001,
        "leartime_s": 0.0491024479852058,
        "sampletime": 2.3628540780046023,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 654000,
        "reward_mean": -0.7850750000000002,
        "reward_max": 0.1187500000000003,
        "reward_min": -1.8310625000000003,
        "leartime_s": 0.0394165120087564,
        "sampletime": 1.6904906530107837,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 656000,
        "reward_mean": -1.0564,
        "reward_max": -0.16731249999999992,
        "reward_min": -2.257125000000001,
        "leartime_s": 0.02039065200369805,
        "sampletime": 2.1820000179868657,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 658000,
        "reward_mean": -0.772425,
        "reward_max": 0.28037500000000015,
        "reward_min": -2.143875000000001,
        "leartime_s": 0.0354914499912411,
        "sampletime": 2.160289454011945,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 660000,
        "reward_mean": -0.9291500000000001,
        "reward_max": 0.2661250000000004,
        "reward_min": -2.1004375000000004,
        "leartime_s": 0.04073684097966179,
        "sampletime": 2.0078144040016923,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 662000,
        "reward_mean": -0.9301750000000002,
        "reward_max": 0.3309375000000003,
        "reward_min": -2.248687500000001,
        "leartime_s": 0.01748389599379152,
        "sampletime": 2.1309081540093757,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 664000,
        "reward_mean": -0.7823000000000002,
        "reward_max": -0.04049999999999973,
        "reward_min": -2.3310000000000004,
        "leartime_s": 0.06817901600152254,
        "sampletime": 1.7422130840132013,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 666000,
        "reward_mean": -1.0514250000000003,
        "reward_max": 0.0033750000000001418,
        "reward_min": -2.670000000000001,
        "leartime_s": 0.04312858000048436,
        "sampletime": 2.1043442800000776,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 668000,
        "reward_mean": -1.0827250000000004,
        "reward_max": -0.21668749999999978,
        "reward_min": -2.6056875,
        "leartime_s": 0.03373105599894188,
        "sampletime": 1.9593193469918333,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 670000,
        "reward_mean": -1.051975,
        "reward_max": -0.13693749999999982,
        "reward_min": -2.048625000000001,
        "leartime_s": 0.03272876999108121,
        "sampletime": 1.7630406120151747,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 672000,
        "reward_mean": -0.8532750000000001,
        "reward_max": 0.1820000000000004,
        "reward_min": -2.156875000000001,
        "leartime_s": 0.04504478699527681,
        "sampletime": 1.7130372000101488,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 674000,
        "reward_mean": -0.9108500000000002,
        "reward_max": -0.08462499999999984,
        "reward_min": -2.474437500000001,
        "leartime_s": 0.047299873986048624,
        "sampletime": 2.0364680720085744,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 676000,
        "reward_mean": -1.015675,
        "reward_max": -0.20731249999999968,
        "reward_min": -2.1042500000000004,
        "leartime_s": 0.04467869200743735,
        "sampletime": 1.8927191289840266,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 678000,
        "reward_mean": -0.9585499999999999,
        "reward_max": 0.25168750000000023,
        "reward_min": -2.1636250000000006,
        "leartime_s": 0.04671765898820013,
        "sampletime": 1.8471810960036237,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 680000,
        "reward_mean": -0.7188750000000002,
        "reward_max": 0.31443750000000004,
        "reward_min": -1.9334375000000001,
        "leartime_s": 0.0717804080049973,
        "sampletime": 2.241204607009422,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 682000,
        "reward_mean": -1.1725,
        "reward_max": 0.04568750000000005,
        "reward_min": -2.430437500000001,
        "leartime_s": 0.04696098100976087,
        "sampletime": 1.984286721009994,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 684000,
        "reward_mean": -0.9986500000000003,
        "reward_max": 0.20325000000000026,
        "reward_min": -2.2612500000000004,
        "leartime_s": 0.03900114801945165,
        "sampletime": 2.023364565015072,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 686000,
        "reward_mean": -0.9291750000000002,
        "reward_max": 0.10937500000000001,
        "reward_min": -2.1258125000000008,
        "leartime_s": 0.03703291298006661,
        "sampletime": 2.205353673984064,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 688000,
        "reward_mean": -0.70745,
        "reward_max": 0.4469375000000004,
        "reward_min": -2.0355625000000006,
        "leartime_s": 0.04253657499793917,
        "sampletime": 1.8291662730043754,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 690000,
        "reward_mean": -0.9862250000000002,
        "reward_max": 0.13356250000000047,
        "reward_min": -2.3531875000000007,
        "leartime_s": 0.06401340602315031,
        "sampletime": 1.9329588430118747,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 692000,
        "reward_mean": -0.8352250000000001,
        "reward_max": 0.08062500000000032,
        "reward_min": -2.2396875,
        "leartime_s": 0.04872669398901053,
        "sampletime": 2.0513451880251523,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 694000,
        "reward_mean": -0.92125,
        "reward_max": 0.31643750000000015,
        "reward_min": -2.3433125000000006,
        "leartime_s": 0.043063808989245445,
        "sampletime": 1.937994248000905,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 696000,
        "reward_mean": -0.70975,
        "reward_max": 0.17387500000000009,
        "reward_min": -2.1563750000000006,
        "leartime_s": 0.08127473198692314,
        "sampletime": 2.235546687996248,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 698000,
        "reward_mean": -1.013025,
        "reward_max": 0.0957500000000002,
        "reward_min": -2.5156875,
        "leartime_s": 0.02015597201534547,
        "sampletime": 1.907254866004223,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 700000,
        "reward_mean": -0.9320750000000001,
        "reward_max": 0.05906250000000014,
        "reward_min": -2.1911875000000003,
        "leartime_s": 0.05179470998700708,
        "sampletime": 1.7811828989943024,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 702000,
        "reward_mean": -0.798025,
        "reward_max": 0.1547500000000003,
        "reward_min": -2.0853124999999997,
        "leartime_s": 0.06900634602061473,
        "sampletime": 2.2084944439993706,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 704000,
        "reward_mean": -0.7294750000000001,
        "reward_max": 0.3327500000000001,
        "reward_min": -1.6864375000000005,
        "leartime_s": 0.02850365699850954,
        "sampletime": 1.7299034949974157,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 706000,
        "reward_mean": -0.8496000000000001,
        "reward_max": 0.2677500000000004,
        "reward_min": -1.9734375000000004,
        "leartime_s": 0.01844643399817869,
        "sampletime": 1.8011368290171959,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 708000,
        "reward_mean": -0.8410000000000001,
        "reward_max": 0.07518750000000049,
        "reward_min": -2.2438750000000005,
        "leartime_s": 0.03844262400525622,
        "sampletime": 2.1496477570035495,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 710000,
        "reward_mean": -0.7317250000000002,
        "reward_max": 0.33037500000000014,
        "reward_min": -2.1882500000000005,
        "leartime_s": 0.04577330098254606,
        "sampletime": 2.0831644109857734,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 712000,
        "reward_mean": -0.7918000000000001,
        "reward_max": 0.21106250000000037,
        "reward_min": -1.8940625000000002,
        "leartime_s": 0.0385409040027298,
        "sampletime": 1.906867901008809,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 714000,
        "reward_mean": -0.9088750000000002,
        "reward_max": -0.0358749999999998,
        "reward_min": -2.4375000000000004,
        "leartime_s": 0.02928159199655056,
        "sampletime": 1.9473504810011946,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 716000,
        "reward_mean": -0.6321500000000001,
        "reward_max": 0.3334375000000004,
        "reward_min": -1.8823125000000007,
        "leartime_s": 0.023343991982983425,
        "sampletime": 1.9516294430068228,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 718000,
        "reward_mean": -0.5915499999999999,
        "reward_max": 0.4290000000000005,
        "reward_min": -2.083125,
        "leartime_s": 0.03764022799441591,
        "sampletime": 1.9904330499994103,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 720000,
        "reward_mean": -0.961075,
        "reward_max": 0.10700000000000032,
        "reward_min": -2.3972500000000005,
        "leartime_s": 0.029614772996865213,
        "sampletime": 2.1659345219959505,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 722000,
        "reward_mean": -0.8255250000000001,
        "reward_max": 0.19300000000000037,
        "reward_min": -1.8679375,
        "leartime_s": 0.0459679150080774,
        "sampletime": 2.1206400240189396,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 724000,
        "reward_mean": -0.9487250000000002,
        "reward_max": 0.022062500000000186,
        "reward_min": -2.5370625000000007,
        "leartime_s": 0.06504008499905467,
        "sampletime": 1.8035521619895007,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 726000,
        "reward_mean": -0.7905999999999999,
        "reward_max": 0.25368750000000034,
        "reward_min": -2.2850625000000004,
        "leartime_s": 0.021782770985737443,
        "sampletime": 1.9383499860123266,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 728000,
        "reward_mean": -0.7192999999999999,
        "reward_max": 0.5790000000000002,
        "reward_min": -2.0965625000000006,
        "leartime_s": 0.020836915995460004,
        "sampletime": 2.206781262997538,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 730000,
        "reward_mean": -0.6222999999999999,
        "reward_max": 0.4823125000000004,
        "reward_min": -2.2170625,
        "leartime_s": 0.046605517010902986,
        "sampletime": 1.754942655999912,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 732000,
        "reward_mean": -0.6715249999999998,
        "reward_max": 0.22268750000000034,
        "reward_min": -1.7247500000000007,
        "leartime_s": 0.0478327690216247,
        "sampletime": 2.1086383670044597,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 734000,
        "reward_mean": -0.7056000000000001,
        "reward_max": 0.3854375000000002,
        "reward_min": -2.0716250000000005,
        "leartime_s": 0.039745694026350975,
        "sampletime": 1.9029621059889905,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 736000,
        "reward_mean": -0.7765250000000001,
        "reward_max": 0.26581250000000034,
        "reward_min": -2.1863125000000005,
        "leartime_s": 0.019365783024113625,
        "sampletime": 2.0547843140084296,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 738000,
        "reward_mean": -0.7645749999999999,
        "reward_max": 0.26487500000000036,
        "reward_min": -2.1945,
        "leartime_s": 0.03764761600177735,
        "sampletime": 1.7475790379976388,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 740000,
        "reward_mean": -0.882725,
        "reward_max": 0.09243750000000053,
        "reward_min": -2.0994375,
        "leartime_s": 0.018594966997625306,
        "sampletime": 1.8559742709912825,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 742000,
        "reward_mean": -0.765425,
        "reward_max": 0.3071875000000002,
        "reward_min": -2.090375,
        "leartime_s": 0.06358448401442729,
        "sampletime": 1.9272911160078365,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 744000,
        "reward_mean": -0.42347499999999993,
        "reward_max": 0.5542500000000002,
        "reward_min": -1.4527500000000002,
        "leartime_s": 0.043462141999043524,
        "sampletime": 2.1362956049852073,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 746000,
        "reward_mean": -0.6888500000000002,
        "reward_max": 0.2927500000000002,
        "reward_min": -2.0204375,
        "leartime_s": 0.032468002988025546,
        "sampletime": 1.7853422759799287,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 748000,
        "reward_mean": -0.785925,
        "reward_max": 0.3606250000000003,
        "reward_min": -2.001500000000001,
        "leartime_s": 0.045762972004013136,
        "sampletime": 1.8108714460104238,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 750000,
        "reward_mean": -0.46484999999999993,
        "reward_max": 0.5465625000000005,
        "reward_min": -1.8704375,
        "leartime_s": 0.03400950398645364,
        "sampletime": 1.942015750973951,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 752000,
        "reward_mean": -0.7951750000000001,
        "reward_max": 0.007500000000000118,
        "reward_min": -1.7958750000000003,
        "leartime_s": 0.03357571497326717,
        "sampletime": 2.038120797020383,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 754000,
        "reward_mean": -0.2174999999999998,
        "reward_max": 0.6812500000000005,
        "reward_min": -1.258,
        "leartime_s": 0.049394139990909025,
        "sampletime": 1.8743301359936595,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 756000,
        "reward_mean": -0.58505,
        "reward_max": 0.37681250000000027,
        "reward_min": -1.5150625000000002,
        "leartime_s": 0.019124351005302742,
        "sampletime": 2.1608242059883196,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 758000,
        "reward_mean": -0.6690749999999999,
        "reward_max": 0.40612500000000024,
        "reward_min": -1.8918750000000002,
        "leartime_s": 0.05287672599661164,
        "sampletime": 1.791419599991059,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 760000,
        "reward_mean": -0.7318499999999999,
        "reward_max": 0.13375000000000012,
        "reward_min": -2.0989374999999995,
        "leartime_s": 0.041164624999510124,
        "sampletime": 1.6157058039971162,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 762000,
        "reward_mean": -0.5595,
        "reward_max": 0.4522500000000002,
        "reward_min": -1.7890625000000002,
        "leartime_s": 0.02990737301297486,
        "sampletime": 1.954272506001871,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 764000,
        "reward_mean": -0.5056249999999999,
        "reward_max": 0.36437500000000017,
        "reward_min": -1.7299375000000008,
        "leartime_s": 0.020089147001272067,
        "sampletime": 2.0657628449844196,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 766000,
        "reward_mean": -0.31842499999999985,
        "reward_max": 0.7319375000000002,
        "reward_min": -2.0772500000000003,
        "leartime_s": 0.055516706983326,
        "sampletime": 2.039232463022927,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 768000,
        "reward_mean": -0.571425,
        "reward_max": 0.40775000000000045,
        "reward_min": -1.8650000000000002,
        "leartime_s": 0.051946729014161974,
        "sampletime": 2.0404963140026666,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 770000,
        "reward_mean": -0.5407249999999999,
        "reward_max": 0.5378750000000002,
        "reward_min": -1.8749375000000004,
        "leartime_s": 0.05099647198221646,
        "sampletime": 1.7853654980135616,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 772000,
        "reward_mean": -0.835475,
        "reward_max": 0.2603750000000003,
        "reward_min": -2.1985,
        "leartime_s": 0.05881136699463241,
        "sampletime": 1.7354425649973564,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 774000,
        "reward_mean": -0.3985249999999999,
        "reward_max": 0.4615000000000002,
        "reward_min": -1.6997500000000003,
        "leartime_s": 0.035722093016374856,
        "sampletime": 2.3008395039942116,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 776000,
        "reward_mean": -0.570875,
        "reward_max": 0.6986250000000004,
        "reward_min": -1.8010000000000004,
        "leartime_s": 0.048222599987639114,
        "sampletime": 1.7046891119971406,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 778000,
        "reward_mean": -0.47879999999999995,
        "reward_max": 0.4939375000000005,
        "reward_min": -1.8092500000000005,
        "leartime_s": 0.03641567801241763,
        "sampletime": 2.104909267014591,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 780000,
        "reward_mean": -0.5002249999999998,
        "reward_max": 0.7731875000000004,
        "reward_min": -1.75925,
        "leartime_s": 0.023640208004508168,
        "sampletime": 2.163393608003389,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 782000,
        "reward_mean": -0.4594999999999998,
        "reward_max": 0.5200000000000005,
        "reward_min": -1.6146874999999996,
        "leartime_s": 0.09307303500827402,
        "sampletime": 1.9255407009914052,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 784000,
        "reward_mean": -0.7086749999999999,
        "reward_max": 0.3979375000000004,
        "reward_min": -2.0261250000000004,
        "leartime_s": 0.024052530992776155,
        "sampletime": 1.9414460969856009,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 786000,
        "reward_mean": -0.43174999999999986,
        "reward_max": 0.5058125000000007,
        "reward_min": -1.4724374999999998,
        "leartime_s": 0.030215128994314,
        "sampletime": 2.0194560530071612,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 788000,
        "reward_mean": -0.5382999999999999,
        "reward_max": 0.3808750000000002,
        "reward_min": -1.71975,
        "leartime_s": 0.045821181003702804,
        "sampletime": 2.134742663009092,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 790000,
        "reward_mean": -0.554,
        "reward_max": 0.4217500000000004,
        "reward_min": -1.8435000000000006,
        "leartime_s": 0.042584976996295154,
        "sampletime": 1.7923097779857926,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 792000,
        "reward_mean": -0.4699249999999998,
        "reward_max": 0.6066250000000004,
        "reward_min": -1.555125,
        "leartime_s": 0.032803949987282977,
        "sampletime": 2.0482436569873244,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 794000,
        "reward_mean": -0.5027499999999999,
        "reward_max": 0.5098750000000004,
        "reward_min": -1.7038125000000006,
        "leartime_s": 0.023911530995974317,
        "sampletime": 2.1365112729836255,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 796000,
        "reward_mean": -0.7421249999999998,
        "reward_max": 0.35925000000000057,
        "reward_min": -1.9185000000000003,
        "leartime_s": 0.05838329897960648,
        "sampletime": 1.782115693000378,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 798000,
        "reward_mean": -0.4691249999999999,
        "reward_max": 0.4416875000000004,
        "reward_min": -2.0525,
        "leartime_s": 0.03608529100893065,
        "sampletime": 2.321940418012673,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 800000,
        "reward_mean": -0.5630499999999998,
        "reward_max": 0.44593750000000054,
        "reward_min": -1.873125,
        "leartime_s": 0.04259533400181681,
        "sampletime": 2.078976299002534,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 802000,
        "reward_mean": -0.8209249999999998,
        "reward_max": 0.4406250000000005,
        "reward_min": -2.156875,
        "leartime_s": 0.054127198993228376,
        "sampletime": 2.0105073189770337,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 804000,
        "reward_mean": -0.3080999999999999,
        "reward_max": 0.5555000000000003,
        "reward_min": -1.3283125,
        "leartime_s": 0.034712081018369645,
        "sampletime": 1.687703714997042,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 806000,
        "reward_mean": -0.4623249999999999,
        "reward_max": 0.6695625000000004,
        "reward_min": -2.2125000000000004,
        "leartime_s": 0.03795533999800682,
        "sampletime": 1.9881117799959611,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 808000,
        "reward_mean": -0.7458749999999998,
        "reward_max": 0.2898750000000003,
        "reward_min": -2.6654375000000003,
        "leartime_s": 0.03963019300135784,
        "sampletime": 1.8740803340042476,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 810000,
        "reward_mean": -0.7160749999999999,
        "reward_max": 0.18768750000000034,
        "reward_min": -2.242187500000001,
        "leartime_s": 0.048779873992316425,
        "sampletime": 1.7821807750151493,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 812000,
        "reward_mean": -0.537625,
        "reward_max": 0.23381250000000026,
        "reward_min": -1.6808750000000003,
        "leartime_s": 0.027549279009690508,
        "sampletime": 1.9249323140247725,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 814000,
        "reward_mean": -0.52155,
        "reward_max": 0.28918750000000026,
        "reward_min": -1.7610625000000004,
        "leartime_s": 0.04852831200696528,
        "sampletime": 1.851304371986771,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 816000,
        "reward_mean": -0.2548999999999999,
        "reward_max": 0.6210625000000005,
        "reward_min": -1.6912500000000006,
        "leartime_s": 0.05080990999704227,
        "sampletime": 1.9341753059998155,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 818000,
        "reward_mean": -0.4943749999999999,
        "reward_max": 0.43687500000000057,
        "reward_min": -1.9165625000000002,
        "leartime_s": 0.021291634999215603,
        "sampletime": 2.287981765024597,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 820000,
        "reward_mean": -0.7614500000000001,
        "reward_max": 0.4428750000000004,
        "reward_min": -1.9161875000000004,
        "leartime_s": 0.06731245902483352,
        "sampletime": 1.9266370340192225,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 822000,
        "reward_mean": -0.5758,
        "reward_max": 0.8120625000000001,
        "reward_min": -1.8996875000000002,
        "leartime_s": 0.06476309199933894,
        "sampletime": 1.7104653310088906,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 824000,
        "reward_mean": -0.57445,
        "reward_max": 0.4616250000000004,
        "reward_min": -1.8682500000000002,
        "leartime_s": 0.02194863199838437,
        "sampletime": 2.206606919004116,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 826000,
        "reward_mean": -0.23579999999999995,
        "reward_max": 0.8897500000000004,
        "reward_min": -1.8896249999999999,
        "leartime_s": 0.054972236015601084,
        "sampletime": 1.767856889986433,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 828000,
        "reward_mean": -0.698525,
        "reward_max": 0.5544375000000004,
        "reward_min": -2.02225,
        "leartime_s": 0.08409866300644353,
        "sampletime": 1.8162692650221288,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 830000,
        "reward_mean": -0.533925,
        "reward_max": 0.3760000000000004,
        "reward_min": -1.8104375,
        "leartime_s": 0.07819044301868416,
        "sampletime": 2.3505441260058433,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 832000,
        "reward_mean": -0.47079999999999983,
        "reward_max": 0.4440000000000005,
        "reward_min": -2.1504374999999993,
        "leartime_s": 0.07718410599045455,
        "sampletime": 1.9465587619924918,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 834000,
        "reward_mean": -0.576825,
        "reward_max": 0.3646875000000004,
        "reward_min": -2.1551875000000003,
        "leartime_s": 0.0821191249997355,
        "sampletime": 1.935007816995494,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 836000,
        "reward_mean": -0.492875,
        "reward_max": 0.3275000000000001,
        "reward_min": -1.6881875000000004,
        "leartime_s": 0.033601985982386395,
        "sampletime": 1.6242276680131909,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 838000,
        "reward_mean": -0.49152499999999993,
        "reward_max": 0.6033125000000006,
        "reward_min": -1.8165,
        "leartime_s": 0.07644167399848811,
        "sampletime": 2.084350272984011,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 840000,
        "reward_mean": -0.450375,
        "reward_max": 0.42043750000000024,
        "reward_min": -1.3196250000000003,
        "leartime_s": 0.10672067000996321,
        "sampletime": 1.9043454449856654,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 842000,
        "reward_mean": -0.6632250000000002,
        "reward_max": 0.15868750000000031,
        "reward_min": -2.1481875000000006,
        "leartime_s": 0.05444904198520817,
        "sampletime": 1.9698624500015285,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 844000,
        "reward_mean": -0.7318,
        "reward_max": 0.32631250000000045,
        "reward_min": -2.1198125,
        "leartime_s": 0.05923098500352353,
        "sampletime": 2.0380731689801905,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 846000,
        "reward_mean": -0.5760749999999999,
        "reward_max": 0.2258125000000004,
        "reward_min": -2.6856875,
        "leartime_s": 0.06529192498419434,
        "sampletime": 1.743034393992275,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 848000,
        "reward_mean": -0.7415750000000001,
        "reward_max": 0.2940000000000005,
        "reward_min": -1.9500625,
        "leartime_s": 0.022426985000493005,
        "sampletime": 2.237668149988167,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 850000,
        "reward_mean": -0.633375,
        "reward_max": 0.5654375000000003,
        "reward_min": -1.7983125000000006,
        "leartime_s": 0.03911105898441747,
        "sampletime": 1.9083658559829928,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 852000,
        "reward_mean": -0.8902500000000001,
        "reward_max": 0.2917500000000003,
        "reward_min": -1.9095000000000004,
        "leartime_s": 0.04780229600146413,
        "sampletime": 1.8187767199997324,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 854000,
        "reward_mean": -0.5548249999999999,
        "reward_max": 0.4765000000000004,
        "reward_min": -1.9903750000000002,
        "leartime_s": 0.04951126000378281,
        "sampletime": 2.018324610980926,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 856000,
        "reward_mean": -0.8021500000000001,
        "reward_max": 0.33237500000000036,
        "reward_min": -1.9873125000000003,
        "leartime_s": 0.032524164009373635,
        "sampletime": 2.0423610620200634,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 858000,
        "reward_mean": -0.8147249999999999,
        "reward_max": 0.10150000000000037,
        "reward_min": -1.9323750000000002,
        "leartime_s": 0.03997321499628015,
        "sampletime": 1.9061293049890082,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 860000,
        "reward_mean": -0.6079749999999999,
        "reward_max": 0.25281250000000033,
        "reward_min": -2.36325,
        "leartime_s": 0.07698619799339212,
        "sampletime": 2.4433187750109937,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 862000,
        "reward_mean": -0.716375,
        "reward_max": 0.31568750000000045,
        "reward_min": -1.7013125,
        "leartime_s": 0.03901771700475365,
        "sampletime": 1.7856761580042075,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 864000,
        "reward_mean": -0.5859999999999999,
        "reward_max": 0.2264375000000003,
        "reward_min": -1.8566250000000006,
        "leartime_s": 0.04305111002759077,
        "sampletime": 2.003180568019161,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 866000,
        "reward_mean": -0.822625,
        "reward_max": 0.29650000000000026,
        "reward_min": -2.097625000000001,
        "leartime_s": 0.0407632420246955,
        "sampletime": 2.1088166410045233,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 868000,
        "reward_mean": -0.7004000000000001,
        "reward_max": 0.4523125000000001,
        "reward_min": -1.7948750000000007,
        "leartime_s": 0.025773993984330446,
        "sampletime": 1.7871148270205595,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 870000,
        "reward_mean": -0.6025,
        "reward_max": 0.3887500000000004,
        "reward_min": -1.7448125000000005,
        "leartime_s": 0.022159774001920596,
        "sampletime": 1.6609595740155783,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 872000,
        "reward_mean": -0.8905250000000001,
        "reward_max": 0.10956250000000037,
        "reward_min": -2.232125,
        "leartime_s": 0.05956988799152896,
        "sampletime": 2.059955525008263,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 874000,
        "reward_mean": -0.9176000000000001,
        "reward_max": 0.12381250000000023,
        "reward_min": -2.0694375000000003,
        "leartime_s": 0.08409058401593938,
        "sampletime": 2.135629948024871,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 876000,
        "reward_mean": -0.8452750000000001,
        "reward_max": 0.0869375000000003,
        "reward_min": -1.96475,
        "leartime_s": 0.02506609002011828,
        "sampletime": 1.7152651409851387,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 878000,
        "reward_mean": -0.695875,
        "reward_max": 0.34718750000000026,
        "reward_min": -1.880062500000001,
        "leartime_s": 0.054834820999531075,
        "sampletime": 2.2113850169989746,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 880000,
        "reward_mean": -0.9172750000000001,
        "reward_max": 0.14843750000000033,
        "reward_min": -2.143437500000001,
        "leartime_s": 0.04613821397651918,
        "sampletime": 2.081343220983399,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 882000,
        "reward_mean": -0.8339249999999999,
        "reward_max": 0.12362500000000023,
        "reward_min": -2.397875,
        "leartime_s": 0.0314288990048226,
        "sampletime": 1.7175625639792997,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 884000,
        "reward_mean": -0.8407250000000002,
        "reward_max": 0.20087500000000033,
        "reward_min": -2.5060625,
        "leartime_s": 0.043721154012018815,
        "sampletime": 2.0630112689977977,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 886000,
        "reward_mean": -0.78625,
        "reward_max": 0.26331250000000045,
        "reward_min": -2.0311875,
        "leartime_s": 0.06606988899875432,
        "sampletime": 2.0306522419850808,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 888000,
        "reward_mean": -1.0444,
        "reward_max": 0.03143750000000055,
        "reward_min": -2.3623749999999997,
        "leartime_s": 0.082669002993498,
        "sampletime": 1.9391834610141814,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 890000,
        "reward_mean": -0.79475,
        "reward_max": 0.13400000000000017,
        "reward_min": -2.1738750000000007,
        "leartime_s": 0.081396711000707,
        "sampletime": 1.9060825210181065,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 892000,
        "reward_mean": -0.865425,
        "reward_max": 0.023375000000000153,
        "reward_min": -2.4648749999999993,
        "leartime_s": 0.091073198011145,
        "sampletime": 1.9222026049974374,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 894000,
        "reward_mean": -0.7964750000000002,
        "reward_max": 0.19256250000000033,
        "reward_min": -2.0214375000000007,
        "leartime_s": 0.07397377499728464,
        "sampletime": 1.9096992270206101,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 896000,
        "reward_mean": -0.9221000000000001,
        "reward_max": 0.04700000000000031,
        "reward_min": -2.1639999999999997,
        "leartime_s": 0.05363625200698152,
        "sampletime": 1.6898226759803947,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 898000,
        "reward_mean": -0.8127750000000001,
        "reward_max": 0.07468749999999999,
        "reward_min": -2.137875,
        "leartime_s": 0.038236299995332956,
        "sampletime": 2.1017345910076983,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 900000,
        "reward_mean": -0.9497500000000001,
        "reward_max": -0.012187499999999636,
        "reward_min": -2.13125,
        "leartime_s": 0.025844274990959093,
        "sampletime": 1.6308708410069812,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 902000,
        "reward_mean": -0.9141500000000001,
        "reward_max": -0.04499999999999982,
        "reward_min": -2.278125,
        "leartime_s": 0.057553482009097934,
        "sampletime": 1.6341098370030522,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 904000,
        "reward_mean": -0.88795,
        "reward_max": 0.09937500000000046,
        "reward_min": -2.2264375,
        "leartime_s": 0.024250523012597114,
        "sampletime": 1.8950126490090042,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 906000,
        "reward_mean": -1.0900750000000003,
        "reward_max": -0.015187499999999854,
        "reward_min": -2.3381250000000002,
        "leartime_s": 0.06944035898777656,
        "sampletime": 2.2071175079909153,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 908000,
        "reward_mean": -0.84725,
        "reward_max": 0.15537500000000032,
        "reward_min": -2.625062500000001,
        "leartime_s": 0.048600991984130815,
        "sampletime": 1.8285703670117073,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 910000,
        "reward_mean": -1.0228000000000002,
        "reward_max": -0.1405624999999997,
        "reward_min": -2.5066249999999997,
        "leartime_s": 0.0930562449793797,
        "sampletime": 1.7240748910116963,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 912000,
        "reward_mean": -1.0355,
        "reward_max": -0.07281249999999964,
        "reward_min": -2.0810625000000007,
        "leartime_s": 0.035330509999766946,
        "sampletime": 2.2054745630011894,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 914000,
        "reward_mean": -1.0293,
        "reward_max": 0.14862500000000037,
        "reward_min": -2.5546875000000004,
        "leartime_s": 0.030723242001840845,
        "sampletime": 2.0132313430076465,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 916000,
        "reward_mean": -0.9086500000000001,
        "reward_max": 0.2258125000000004,
        "reward_min": -2.2753125000000005,
        "leartime_s": 0.04870738397585228,
        "sampletime": 1.962554079014808,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 918000,
        "reward_mean": -0.8281250000000001,
        "reward_max": 0.07393750000000021,
        "reward_min": -2.024375,
        "leartime_s": 0.03923863000818528,
        "sampletime": 1.9614899999869522,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 920000,
        "reward_mean": -0.8703,
        "reward_max": 0.1091875000000005,
        "reward_min": -1.8949999999999996,
        "leartime_s": 0.033559736009920016,
        "sampletime": 1.7576908970077056,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 922000,
        "reward_mean": -0.8456,
        "reward_max": 0.16487500000000035,
        "reward_min": -2.1230625,
        "leartime_s": 0.06466673000250012,
        "sampletime": 2.1419416409917176,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 924000,
        "reward_mean": -1.0304,
        "reward_max": -0.04624999999999965,
        "reward_min": -2.2798125000000002,
        "leartime_s": 0.04278887700638734,
        "sampletime": 2.105155883007683,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 926000,
        "reward_mean": -0.9281250000000001,
        "reward_max": 0.5050625000000003,
        "reward_min": -2.184375,
        "leartime_s": 0.08961884598829783,
        "sampletime": 1.865103021991672,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 928000,
        "reward_mean": -1.11075,
        "reward_max": -0.005312499999999637,
        "reward_min": -2.251750000000001,
        "leartime_s": 0.09031178199802525,
        "sampletime": 2.038351687020622,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 930000,
        "reward_mean": -1.1969750000000001,
        "reward_max": -0.1573124999999999,
        "reward_min": -2.819,
        "leartime_s": 0.026570747984806076,
        "sampletime": 2.0141572450229432,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 932000,
        "reward_mean": -0.99275,
        "reward_max": -0.07643749999999977,
        "reward_min": -2.285625000000001,
        "leartime_s": 0.045021325000561774,
        "sampletime": 1.8103824610006995,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 934000,
        "reward_mean": -1.0687250000000001,
        "reward_max": -0.10499999999999987,
        "reward_min": -3.1092500000000007,
        "leartime_s": 0.03102298200246878,
        "sampletime": 1.6363668629783206,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 936000,
        "reward_mean": -1.1324750000000001,
        "reward_max": -0.17812499999999984,
        "reward_min": -2.0266875000000004,
        "leartime_s": 0.0399653360072989,
        "sampletime": 1.7652724439976737,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 938000,
        "reward_mean": -1.0534000000000001,
        "reward_max": -0.08556249999999987,
        "reward_min": -1.9534375000000008,
        "leartime_s": 0.024828844994772226,
        "sampletime": 1.5893386279931292,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 940000,
        "reward_mean": -0.7641250000000002,
        "reward_max": 0.4047500000000004,
        "reward_min": -1.9934375000000006,
        "leartime_s": 0.06123946199659258,
        "sampletime": 1.6552642700262368,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 942000,
        "reward_mean": -1.0473000000000001,
        "reward_max": -0.12956249999999997,
        "reward_min": -2.553937500000001,
        "leartime_s": 0.041322425997350365,
        "sampletime": 1.5802716680045705,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 944000,
        "reward_mean": -0.9954250000000002,
        "reward_max": 0.31750000000000034,
        "reward_min": -2.1983125,
        "leartime_s": 0.05049677801434882,
        "sampletime": 1.6015178639790975,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 946000,
        "reward_mean": -0.8661750000000001,
        "reward_max": 0.06762500000000014,
        "reward_min": -2.1790000000000003,
        "leartime_s": 0.04762390398536809,
        "sampletime": 1.5545165980001912,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 948000,
        "reward_mean": -0.9603250000000002,
        "reward_max": 0.19325000000000025,
        "reward_min": -2.1300000000000003,
        "leartime_s": 0.035283658013213426,
        "sampletime": 1.518255456991028,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 950000,
        "reward_mean": -0.85275,
        "reward_max": 0.3504375000000002,
        "reward_min": -1.8654375000000005,
        "leartime_s": 0.039378951012622565,
        "sampletime": 1.5862890249991324,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 952000,
        "reward_mean": -0.9057500000000002,
        "reward_max": -0.017187499999999883,
        "reward_min": -2.085125,
        "leartime_s": 0.04437498000334017,
        "sampletime": 1.5415403219813015,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 954000,
        "reward_mean": -0.8695000000000002,
        "reward_max": 0.041375000000000245,
        "reward_min": -2.1285625000000006,
        "leartime_s": 0.02926868200302124,
        "sampletime": 1.637487668020185,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 956000,
        "reward_mean": -1.023425,
        "reward_max": 0.1277500000000003,
        "reward_min": -2.3443125,
        "leartime_s": 0.033862684009363875,
        "sampletime": 1.589592710020952,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 958000,
        "reward_mean": -1.004275,
        "reward_max": 0.013312499999999991,
        "reward_min": -2.774687500000001,
        "leartime_s": 0.0251610109989997,
        "sampletime": 1.5658787009888329,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 960000,
        "reward_mean": -0.9016750000000001,
        "reward_max": 0.20518750000000024,
        "reward_min": -2.597062500000001,
        "leartime_s": 0.05420707701705396,
        "sampletime": 1.540095610980643,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 962000,
        "reward_mean": -0.9119750000000001,
        "reward_max": 0.3475625000000002,
        "reward_min": -2.095500000000001,
        "leartime_s": 0.031116216006921604,
        "sampletime": 1.637611016019946,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 964000,
        "reward_mean": -0.9601000000000002,
        "reward_max": 0.1936875000000004,
        "reward_min": -2.291,
        "leartime_s": 0.02379458799259737,
        "sampletime": 1.6309806659992319,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 966000,
        "reward_mean": -1.1268500000000001,
        "reward_max": 0.09293750000000013,
        "reward_min": -2.8232500000000003,
        "leartime_s": 0.02559218101669103,
        "sampletime": 1.464567963994341,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 968000,
        "reward_mean": -0.7696500000000001,
        "reward_max": 0.34862500000000013,
        "reward_min": -1.7308750000000004,
        "leartime_s": 0.036645979998866096,
        "sampletime": 1.649801113002468,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 970000,
        "reward_mean": -0.9997250000000001,
        "reward_max": 0.0781875000000003,
        "reward_min": -2.211250000000001,
        "leartime_s": 0.024495921010384336,
        "sampletime": 1.5408535970200319,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 972000,
        "reward_mean": -0.9713250000000001,
        "reward_max": 0.014312500000000047,
        "reward_min": -2.1018750000000006,
        "leartime_s": 0.07603856001514941,
        "sampletime": 1.6263220270047896,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 974000,
        "reward_mean": -0.9088000000000002,
        "reward_max": 0.11981250000000032,
        "reward_min": -2.2273750000000008,
        "leartime_s": 0.06318791600642726,
        "sampletime": 1.5635070230055135,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 976000,
        "reward_mean": -0.868175,
        "reward_max": 0.3207500000000001,
        "reward_min": -2.2930625000000004,
        "leartime_s": 0.08440855602384545,
        "sampletime": 1.5617352300032508,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 978000,
        "reward_mean": -0.9262250000000002,
        "reward_max": 0.047750000000000084,
        "reward_min": -2.659500000000001,
        "leartime_s": 0.06096194899873808,
        "sampletime": 1.534237835003296,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 980000,
        "reward_mean": -1.07395,
        "reward_max": -0.19187499999999988,
        "reward_min": -2.55925,
        "leartime_s": 0.025086615001782775,
        "sampletime": 1.6286790950107388,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 982000,
        "reward_mean": -0.8229000000000001,
        "reward_max": 0.30887500000000045,
        "reward_min": -1.8987500000000006,
        "leartime_s": 0.03042006099713035,
        "sampletime": 1.6598652399843559,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 984000,
        "reward_mean": -0.9884250000000001,
        "reward_max": -0.08937499999999968,
        "reward_min": -2.035562500000001,
        "leartime_s": 0.033440623024944216,
        "sampletime": 1.5797260190011002,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 986000,
        "reward_mean": -0.9692750000000001,
        "reward_max": 0.20825000000000038,
        "reward_min": -2.3427500000000006,
        "leartime_s": 0.024903008015826344,
        "sampletime": 1.5407375119975768,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 988000,
        "reward_mean": -0.9935750000000001,
        "reward_max": 0.3771250000000003,
        "reward_min": -2.431750000000001,
        "leartime_s": 0.041315056005259976,
        "sampletime": 1.5772296799987089,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 990000,
        "reward_mean": -1.05965,
        "reward_max": -0.09812499999999963,
        "reward_min": -2.2400625,
        "leartime_s": 0.02933367298101075,
        "sampletime": 1.5959868959907908,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 992000,
        "reward_mean": -0.8746750000000001,
        "reward_max": 0.20818750000000033,
        "reward_min": -2.6138750000000006,
        "leartime_s": 0.05289158600498922,
        "sampletime": 1.5707248089893255,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 994000,
        "reward_mean": -0.9337500000000002,
        "reward_max": -0.03899999999999991,
        "reward_min": -2.2866875000000007,
        "leartime_s": 0.059675739001249894,
        "sampletime": 1.6199884170200676,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 996000,
        "reward_mean": -0.8957250000000001,
        "reward_max": 0.005312500000000123,
        "reward_min": -2.2497500000000006,
        "leartime_s": 0.052986657014116645,
        "sampletime": 1.6761589880043175,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 998000,
        "reward_mean": -0.516425,
        "reward_max": 0.4775000000000002,
        "reward_min": -1.7019375000000003,
        "leartime_s": 0.02698025098652579,
        "sampletime": 1.555253585014725,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 1000000,
        "reward_mean": -0.7376,
        "reward_max": 0.5802500000000002,
        "reward_min": -1.9243750000000008,
        "leartime_s": 0.034063138999044895,
        "sampletime": 1.6048108649847563,
        "best_mean": 0.4569750000000004,
        "best_max": 1.4353750000000005,
        "params": {
            "agentsize": 100,
            "yellow": 0,
            "seeds": 239913,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]