[
    {
        "generation": 1,
        "timesteps": 200,
        "reward_mean": -38.991400000000006,
        "reward_max": -0.28181875,
        "reward_min": -81.84466875000005,
        "leartime_s": 0.025158950011245906,
        "sampletime": 0.9668855280033313,
        "best_mean": -38.991400000000006,
        "best_max": -0.28181875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 400,
        "reward_mean": -36.44964999999999,
        "reward_max": -0.17726250000000007,
        "reward_min": -172.84188124999997,
        "leartime_s": 0.010213400004431605,
        "sampletime": 1.1315143830142915,
        "best_mean": -36.44964999999999,
        "best_max": -0.17726250000000007,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 600,
        "reward_mean": -20.045824999999997,
        "reward_max": 0.5236375,
        "reward_min": -218.261175,
        "leartime_s": 0.02126989999669604,
        "sampletime": 0.811883463000413,
        "best_mean": -20.045824999999997,
        "best_max": 0.5236375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 800,
        "reward_mean": -18.038725,
        "reward_max": 1.8786624999999992,
        "reward_min": -35.4953125,
        "leartime_s": 0.006016497005475685,
        "sampletime": 0.772760758001823,
        "best_mean": -18.038725,
        "best_max": 1.8786624999999992,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 1000,
        "reward_mean": -17.961475,
        "reward_max": 1.7625749999999998,
        "reward_min": -35.531612499999994,
        "leartime_s": 0.038037785998312756,
        "sampletime": 0.8602536940015852,
        "best_mean": -17.961475,
        "best_max": 1.7625749999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 1200,
        "reward_mean": -17.5113,
        "reward_max": 0.5303125000000001,
        "reward_min": -73.2064875,
        "leartime_s": 0.022065461991587654,
        "sampletime": 0.9278127139841672,
        "best_mean": -17.5113,
        "best_max": 0.5303125000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 1400,
        "reward_mean": -10.68055,
        "reward_max": -0.9913062499999999,
        "reward_min": -114.88326874999998,
        "leartime_s": 0.008153764007147402,
        "sampletime": 0.8337547270057257,
        "best_mean": -10.68055,
        "best_max": -0.9913062499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 1600,
        "reward_mean": -8.657174999999999,
        "reward_max": -0.25994999999999996,
        "reward_min": -74.75618125,
        "leartime_s": 0.023413821996655315,
        "sampletime": 0.7246948200045153,
        "best_mean": -8.657174999999999,
        "best_max": -0.25994999999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 1800,
        "reward_mean": -7.298850000000001,
        "reward_max": 0.7115812499999999,
        "reward_min": -93.31526874999999,
        "leartime_s": 0.045776350976666436,
        "sampletime": 0.6991993859992363,
        "best_mean": -7.298850000000001,
        "best_max": 0.7115812499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 2000,
        "reward_mean": -4.336024999999999,
        "reward_max": 0.25469375000000005,
        "reward_min": -35.357706250000014,
        "leartime_s": 0.01528346401755698,
        "sampletime": 0.8671641669934615,
        "best_mean": -4.336024999999999,
        "best_max": 0.25469375000000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 2200,
        "reward_mean": -2.9976749999999996,
        "reward_max": -0.1364375000000001,
        "reward_min": -9.86535625,
        "leartime_s": 0.0415231240040157,
        "sampletime": 0.8993682319996879,
        "best_mean": -2.9976749999999996,
        "best_max": -0.1364375000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 2400,
        "reward_mean": -2.5294499999999993,
        "reward_max": -0.5357312499999997,
        "reward_min": -5.958068749999999,
        "leartime_s": 0.022274333983659744,
        "sampletime": 1.0333067629835568,
        "best_mean": -2.5294499999999993,
        "best_max": -0.5357312499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 2600,
        "reward_mean": -2.506575,
        "reward_max": -0.6808000000000001,
        "reward_min": -5.98708125,
        "leartime_s": 0.03736372198909521,
        "sampletime": 0.9366239930095617,
        "best_mean": -2.506575,
        "best_max": -0.6808000000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 2800,
        "reward_mean": -2.0233250000000007,
        "reward_max": -0.60830625,
        "reward_min": -4.083818750000001,
        "leartime_s": 0.01259176799794659,
        "sampletime": 0.8758018240041565,
        "best_mean": -2.0233250000000007,
        "best_max": -0.60830625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 3000,
        "reward_mean": -2.016950000000001,
        "reward_max": -1.0646,
        "reward_min": -4.87439375,
        "leartime_s": 0.042474124988075346,
        "sampletime": 0.9957140279875603,
        "best_mean": -2.016950000000001,
        "best_max": -1.0646,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 3200,
        "reward_mean": -1.9514250000000002,
        "reward_max": -0.8323062499999998,
        "reward_min": -3.63835625,
        "leartime_s": 0.03780171400285326,
        "sampletime": 0.8326177790004294,
        "best_mean": -1.9514250000000002,
        "best_max": -0.8323062499999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 3400,
        "reward_mean": -1.7734,
        "reward_max": -0.6648937500000003,
        "reward_min": -3.277387499999999,
        "leartime_s": 0.013533104996895418,
        "sampletime": 1.0129155709873885,
        "best_mean": -1.7734,
        "best_max": -0.6648937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 3600,
        "reward_mean": -1.8754,
        "reward_max": -0.7945749999999998,
        "reward_min": -3.1623375,
        "leartime_s": 0.03677795099793002,
        "sampletime": 0.8849235750094522,
        "best_mean": -1.7734,
        "best_max": -0.6648937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 3800,
        "reward_mean": -1.7679749999999996,
        "reward_max": -0.87030625,
        "reward_min": -2.9835312499999995,
        "leartime_s": 0.006876453990116715,
        "sampletime": 0.845302706991788,
        "best_mean": -1.7679749999999996,
        "best_max": -0.87030625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 4000,
        "reward_mean": -1.76575,
        "reward_max": -0.5485875,
        "reward_min": -3.0360812500000005,
        "leartime_s": 0.024604862002888694,
        "sampletime": 0.9561208439990878,
        "best_mean": -1.76575,
        "best_max": -0.5485875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 4200,
        "reward_mean": -1.7636249999999996,
        "reward_max": -0.7059062500000001,
        "reward_min": -3.4004874999999997,
        "leartime_s": 0.017648061009822413,
        "sampletime": 1.0348984229785856,
        "best_mean": -1.7636249999999996,
        "best_max": -0.7059062500000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 4400,
        "reward_mean": -1.674125,
        "reward_max": -0.5359312499999999,
        "reward_min": -3.362531250000001,
        "leartime_s": 0.020432278979569674,
        "sampletime": 0.8391748299764004,
        "best_mean": -1.674125,
        "best_max": -0.5359312499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 4600,
        "reward_mean": -1.6178000000000001,
        "reward_max": -0.6408,
        "reward_min": -2.832875,
        "leartime_s": 0.006842512986622751,
        "sampletime": 0.8774029079941101,
        "best_mean": -1.6178000000000001,
        "best_max": -0.6408,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 4800,
        "reward_mean": -1.4415,
        "reward_max": -0.45740625,
        "reward_min": -2.77246875,
        "leartime_s": 0.013564835011493415,
        "sampletime": 1.044475540984422,
        "best_mean": -1.4415,
        "best_max": -0.45740625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 5000,
        "reward_mean": -1.5839250000000002,
        "reward_max": -0.4042375,
        "reward_min": -3.056656249999999,
        "leartime_s": 0.033687273011310026,
        "sampletime": 1.02126696598134,
        "best_mean": -1.4415,
        "best_max": -0.45740625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 5200,
        "reward_mean": -1.7385,
        "reward_max": -0.4640437500000001,
        "reward_min": -3.207325000000001,
        "leartime_s": 0.035344668984180316,
        "sampletime": 0.8553247750096489,
        "best_mean": -1.4415,
        "best_max": -0.45740625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 5400,
        "reward_mean": -1.5659250000000002,
        "reward_max": -0.42533749999999976,
        "reward_min": -2.877112500000001,
        "leartime_s": 0.02799282898195088,
        "sampletime": 0.7515671089931857,
        "best_mean": -1.4415,
        "best_max": -0.45740625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 5600,
        "reward_mean": -1.6682249999999998,
        "reward_max": -0.6759000000000001,
        "reward_min": -2.8909750000000005,
        "leartime_s": 0.0380601899814792,
        "sampletime": 1.152319865010213,
        "best_mean": -1.4415,
        "best_max": -0.45740625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 5800,
        "reward_mean": -1.354975,
        "reward_max": -0.2128999999999999,
        "reward_min": -2.7529750000000006,
        "leartime_s": 0.06445928598986939,
        "sampletime": 0.8657853369950317,
        "best_mean": -1.354975,
        "best_max": -0.2128999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 6000,
        "reward_mean": -1.58285,
        "reward_max": -0.7377750000000003,
        "reward_min": -2.8073625,
        "leartime_s": 0.008256125001935288,
        "sampletime": 0.7790702229831368,
        "best_mean": -1.354975,
        "best_max": -0.2128999999999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 6200,
        "reward_mean": -1.251475,
        "reward_max": -0.342075,
        "reward_min": -2.31918125,
        "leartime_s": 0.007032485998934135,
        "sampletime": 0.8995681929809507,
        "best_mean": -1.251475,
        "best_max": -0.342075,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 6400,
        "reward_mean": -1.4413249999999997,
        "reward_max": -0.40353125000000006,
        "reward_min": -3.29155625,
        "leartime_s": 0.01450072298757732,
        "sampletime": 0.9208700899907853,
        "best_mean": -1.251475,
        "best_max": -0.342075,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 6600,
        "reward_mean": -1.2926999999999997,
        "reward_max": -0.36011249999999984,
        "reward_min": -2.5529500000000005,
        "leartime_s": 0.014200209989212453,
        "sampletime": 0.7969092369894497,
        "best_mean": -1.251475,
        "best_max": -0.342075,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 6800,
        "reward_mean": -1.2051999999999998,
        "reward_max": -0.33106874999999986,
        "reward_min": -2.1097187500000003,
        "leartime_s": 0.012538347014924511,
        "sampletime": 0.8389255939982831,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 7000,
        "reward_mean": -1.4497499999999999,
        "reward_max": -0.6351375000000001,
        "reward_min": -2.38579375,
        "leartime_s": 0.05465973899117671,
        "sampletime": 1.140249710995704,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 7200,
        "reward_mean": -1.3191,
        "reward_max": -0.39011250000000003,
        "reward_min": -2.534375,
        "leartime_s": 0.03876866400241852,
        "sampletime": 0.8685844170104247,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 7400,
        "reward_mean": -1.4605000000000001,
        "reward_max": -0.42708749999999995,
        "reward_min": -2.6048125000000004,
        "leartime_s": 0.03775530800339766,
        "sampletime": 0.8546011279977392,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 7600,
        "reward_mean": -1.4844999999999997,
        "reward_max": -0.5169374999999999,
        "reward_min": -2.7446312500000003,
        "leartime_s": 0.030977152986451983,
        "sampletime": 1.1963485319865867,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 7800,
        "reward_mean": -1.27785,
        "reward_max": -0.3444874999999997,
        "reward_min": -2.6031875,
        "leartime_s": 0.05628250297741033,
        "sampletime": 0.9319482020218857,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 8000,
        "reward_mean": -1.3144500000000001,
        "reward_max": -0.4285999999999998,
        "reward_min": -2.5392999999999994,
        "leartime_s": 0.008632306999061257,
        "sampletime": 0.7624270480009727,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 8200,
        "reward_mean": -1.3121249999999998,
        "reward_max": -0.50116875,
        "reward_min": -2.4120250000000008,
        "leartime_s": 0.00853193600778468,
        "sampletime": 0.8543778340099379,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 8400,
        "reward_mean": -1.21425,
        "reward_max": -0.27795,
        "reward_min": -2.1107750000000003,
        "leartime_s": 0.017269269010284916,
        "sampletime": 1.04237226000987,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 8600,
        "reward_mean": -1.3379250000000003,
        "reward_max": -0.44571249999999996,
        "reward_min": -2.4936625,
        "leartime_s": 0.051670726999873295,
        "sampletime": 0.8185344540106598,
        "best_mean": -1.2051999999999998,
        "best_max": -0.33106874999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 8800,
        "reward_mean": -1.188275,
        "reward_max": -0.18667500000000004,
        "reward_min": -2.3661749999999997,
        "leartime_s": 0.04243393399519846,
        "sampletime": 0.7805040550010744,
        "best_mean": -1.188275,
        "best_max": -0.18667500000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 9000,
        "reward_mean": -1.3273499999999998,
        "reward_max": -0.44401874999999985,
        "reward_min": -2.8776374999999996,
        "leartime_s": 0.022095912019722164,
        "sampletime": 0.722092869982589,
        "best_mean": -1.188275,
        "best_max": -0.18667500000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 9200,
        "reward_mean": -1.3033500000000002,
        "reward_max": -0.5254749999999998,
        "reward_min": -2.6924062500000003,
        "leartime_s": 0.027429132984252647,
        "sampletime": 0.7040847600146662,
        "best_mean": -1.188275,
        "best_max": -0.18667500000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 9400,
        "reward_mean": -1.2494250000000002,
        "reward_max": -0.484775,
        "reward_min": -2.2981374999999997,
        "leartime_s": 0.021250165009405464,
        "sampletime": 0.7800641730136704,
        "best_mean": -1.188275,
        "best_max": -0.18667500000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 9600,
        "reward_mean": -1.1390250000000002,
        "reward_max": -0.30720624999999996,
        "reward_min": -2.2518875000000005,
        "leartime_s": 0.010273432009853423,
        "sampletime": 0.834786441992037,
        "best_mean": -1.1390250000000002,
        "best_max": -0.30720624999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 9800,
        "reward_mean": -1.1505999999999998,
        "reward_max": -0.3797499999999998,
        "reward_min": -1.9588625,
        "leartime_s": 0.02771623499575071,
        "sampletime": 0.8187657970120199,
        "best_mean": -1.1390250000000002,
        "best_max": -0.30720624999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 10000,
        "reward_mean": -1.3499250000000005,
        "reward_max": -0.4957250000000002,
        "reward_min": -2.3087312500000006,
        "leartime_s": 0.012709833012195304,
        "sampletime": 0.7658622399903834,
        "best_mean": -1.1390250000000002,
        "best_max": -0.30720624999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 10200,
        "reward_mean": -1.279325,
        "reward_max": -0.38595,
        "reward_min": -2.491981250000001,
        "leartime_s": 0.027991217997623608,
        "sampletime": 0.8057163349876646,
        "best_mean": -1.1390250000000002,
        "best_max": -0.30720624999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 10400,
        "reward_mean": -1.068025,
        "reward_max": -0.15715625000000016,
        "reward_min": -2.1530937500000005,
        "leartime_s": 0.03466446400852874,
        "sampletime": 0.9611961340124253,
        "best_mean": -1.068025,
        "best_max": -0.15715625000000016,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 10600,
        "reward_mean": -1.1870999999999998,
        "reward_max": -0.25762500000000005,
        "reward_min": -2.3144125000000004,
        "leartime_s": 0.02343655299046077,
        "sampletime": 0.8581702670198865,
        "best_mean": -1.068025,
        "best_max": -0.15715625000000016,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 10800,
        "reward_mean": -1.224225,
        "reward_max": -0.25083125,
        "reward_min": -2.51020625,
        "leartime_s": 0.061490222986321896,
        "sampletime": 0.9762334820115939,
        "best_mean": -1.068025,
        "best_max": -0.15715625000000016,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 11000,
        "reward_mean": -1.135875,
        "reward_max": -0.24833750000000007,
        "reward_min": -2.8767125,
        "leartime_s": 0.01971990300808102,
        "sampletime": 0.8927005959849339,
        "best_mean": -1.068025,
        "best_max": -0.15715625000000016,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 11200,
        "reward_mean": -1.26005,
        "reward_max": -0.31572500000000014,
        "reward_min": -2.1926249999999996,
        "leartime_s": 0.04140768697834574,
        "sampletime": 0.7268370639940258,
        "best_mean": -1.068025,
        "best_max": -0.15715625000000016,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 11400,
        "reward_mean": -0.9492,
        "reward_max": -0.11331875000000009,
        "reward_min": -2.05226875,
        "leartime_s": 0.01713338599074632,
        "sampletime": 0.868436507997103,
        "best_mean": -0.9492,
        "best_max": -0.11331875000000009,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 11600,
        "reward_mean": -1.0600500000000002,
        "reward_max": -0.07135625000000012,
        "reward_min": -2.1438125,
        "leartime_s": 0.028892934002215043,
        "sampletime": 1.0114753099915106,
        "best_mean": -0.9492,
        "best_max": -0.11331875000000009,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 11800,
        "reward_mean": -0.8456999999999998,
        "reward_max": 0.06701874999999996,
        "reward_min": -1.6882562499999998,
        "leartime_s": 0.030773430014960468,
        "sampletime": 0.8103874009975698,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 12000,
        "reward_mean": -1.0724999999999996,
        "reward_max": -0.17785000000000006,
        "reward_min": -2.41945,
        "leartime_s": 0.023644377011805773,
        "sampletime": 0.8037955070030876,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 12200,
        "reward_mean": -0.9497250000000002,
        "reward_max": -0.12010000000000004,
        "reward_min": -1.9794749999999994,
        "leartime_s": 0.0235493479995057,
        "sampletime": 1.0547702570038382,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 12400,
        "reward_mean": -1.1328999999999998,
        "reward_max": -0.059062500000000004,
        "reward_min": -2.7064875000000006,
        "leartime_s": 0.018605903984280303,
        "sampletime": 0.7664435059996322,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 12600,
        "reward_mean": -1.0633,
        "reward_max": -0.15746249999999998,
        "reward_min": -2.3486500000000006,
        "leartime_s": 0.03809123000246473,
        "sampletime": 0.8064374410023447,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 12800,
        "reward_mean": -0.923975,
        "reward_max": -0.11632500000000012,
        "reward_min": -2.2934124999999996,
        "leartime_s": 0.020305187994381413,
        "sampletime": 0.831275064003421,
        "best_mean": -0.8456999999999998,
        "best_max": 0.06701874999999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 13000,
        "reward_mean": -0.585275,
        "reward_max": 0.28285624999999986,
        "reward_min": -2.0680625,
        "leartime_s": 0.04203332102042623,
        "sampletime": 0.8999468529946171,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 13200,
        "reward_mean": -0.9700000000000002,
        "reward_max": -0.14488125000000027,
        "reward_min": -2.0643374999999997,
        "leartime_s": 0.04971836099866778,
        "sampletime": 0.8242737399996258,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 13400,
        "reward_mean": -1.21125,
        "reward_max": -0.29348750000000023,
        "reward_min": -2.4693125,
        "leartime_s": 0.015096507006091997,
        "sampletime": 0.7962239010084886,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 13600,
        "reward_mean": -1.06725,
        "reward_max": -0.27680000000000016,
        "reward_min": -1.9779375000000003,
        "leartime_s": 0.008139254001434892,
        "sampletime": 1.0626003470097203,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 13800,
        "reward_mean": -0.9718750000000003,
        "reward_max": 0.029931249999999895,
        "reward_min": -2.346343750000001,
        "leartime_s": 0.040013925987295806,
        "sampletime": 0.7717389860190451,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 14000,
        "reward_mean": -0.768125,
        "reward_max": 0.13303750000000023,
        "reward_min": -1.8031187499999992,
        "leartime_s": 0.026299894991097972,
        "sampletime": 0.7728352989943232,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 14200,
        "reward_mean": -0.9740749999999998,
        "reward_max": -0.05199374999999995,
        "reward_min": -1.90550625,
        "leartime_s": 0.03797753600520082,
        "sampletime": 0.899875021976186,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 14400,
        "reward_mean": -1.007,
        "reward_max": -0.04714999999999997,
        "reward_min": -2.183175,
        "leartime_s": 0.02960526500828564,
        "sampletime": 0.9380212299874984,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 14600,
        "reward_mean": -1.19345,
        "reward_max": -0.289625,
        "reward_min": -2.5290999999999997,
        "leartime_s": 0.046330443990882486,
        "sampletime": 0.7575238849967718,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 14800,
        "reward_mean": -1.07565,
        "reward_max": -0.16078749999999994,
        "reward_min": -2.3311874999999995,
        "leartime_s": 0.0210634539835155,
        "sampletime": 0.8599771020235494,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 15000,
        "reward_mean": -0.9633499999999999,
        "reward_max": 0.10108125000000005,
        "reward_min": -2.0392125000000005,
        "leartime_s": 0.0353597869980149,
        "sampletime": 1.0656106539827306,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 15200,
        "reward_mean": -0.8428249999999998,
        "reward_max": 0.07240000000000008,
        "reward_min": -2.24438125,
        "leartime_s": 0.0246029710106086,
        "sampletime": 0.9434496659960132,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 15400,
        "reward_mean": -0.9316500000000001,
        "reward_max": 0.16418125,
        "reward_min": -1.8950375000000002,
        "leartime_s": 0.016238526994129643,
        "sampletime": 0.8668739849817939,
        "best_mean": -0.585275,
        "best_max": 0.28285624999999986,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 15600,
        "reward_mean": -0.4566249999999999,
        "reward_max": 0.5167750000000001,
        "reward_min": -1.8147562500000003,
        "leartime_s": 0.016376276995288208,
        "sampletime": 1.1786360400146805,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 15800,
        "reward_mean": -0.6317499999999998,
        "reward_max": 0.2818500000000001,
        "reward_min": -1.7563624999999996,
        "leartime_s": 0.07446276402333751,
        "sampletime": 0.8305183380143717,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 16000,
        "reward_mean": -0.7130249999999999,
        "reward_max": 0.0997562500000001,
        "reward_min": -2.0320812499999996,
        "leartime_s": 0.02107466899906285,
        "sampletime": 0.8351820640091319,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 16200,
        "reward_mean": -0.660825,
        "reward_max": 0.17820625,
        "reward_min": -1.7747312500000003,
        "leartime_s": 0.04886156300199218,
        "sampletime": 0.9051063150109258,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 16400,
        "reward_mean": -0.6621999999999999,
        "reward_max": 0.20816249999999997,
        "reward_min": -1.6817374999999992,
        "leartime_s": 0.009462742978939787,
        "sampletime": 0.8083351310051512,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 16600,
        "reward_mean": -0.5370500000000001,
        "reward_max": 0.21918124999999983,
        "reward_min": -1.72149375,
        "leartime_s": 0.02048523401026614,
        "sampletime": 0.7033632489910815,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 16800,
        "reward_mean": -0.5767749999999999,
        "reward_max": 0.4599312500000001,
        "reward_min": -1.70325,
        "leartime_s": 0.04649105598218739,
        "sampletime": 0.9056671180005651,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 17000,
        "reward_mean": -0.5945,
        "reward_max": 0.23853124999999994,
        "reward_min": -1.8312750000000007,
        "leartime_s": 0.03824465800425969,
        "sampletime": 1.2034691169974394,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 17200,
        "reward_mean": -0.6233250000000001,
        "reward_max": 0.3002687499999998,
        "reward_min": -2.0147375000000003,
        "leartime_s": 0.029356359009398147,
        "sampletime": 0.8100927890045568,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 17400,
        "reward_mean": -0.565525,
        "reward_max": 0.3999124999999999,
        "reward_min": -1.9033124999999995,
        "leartime_s": 0.026903258985839784,
        "sampletime": 0.7917445859930012,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 17600,
        "reward_mean": -0.7608500000000002,
        "reward_max": 0.2191312500000001,
        "reward_min": -1.7179937500000007,
        "leartime_s": 0.01996725599747151,
        "sampletime": 1.0154581000097096,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 17800,
        "reward_mean": -0.501675,
        "reward_max": 0.58304375,
        "reward_min": -1.9773062499999996,
        "leartime_s": 0.037399531982373446,
        "sampletime": 0.9341215530002955,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 18000,
        "reward_mean": -0.5013249999999999,
        "reward_max": 0.3430500000000002,
        "reward_min": -1.6806437500000002,
        "leartime_s": 0.05669043099624105,
        "sampletime": 0.784098386997357,
        "best_mean": -0.4566249999999999,
        "best_max": 0.5167750000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 18200,
        "reward_mean": -0.28949999999999987,
        "reward_max": 0.5161250000000001,
        "reward_min": -1.2322625,
        "leartime_s": 0.00770502001978457,
        "sampletime": 0.8857495920092333,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 18400,
        "reward_mean": -0.37175,
        "reward_max": 0.6441437500000001,
        "reward_min": -1.73924375,
        "leartime_s": 0.05073139499290846,
        "sampletime": 0.8145054130000062,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 18600,
        "reward_mean": -0.5440499999999999,
        "reward_max": 0.3634750000000001,
        "reward_min": -1.9558187500000002,
        "leartime_s": 0.0080217829963658,
        "sampletime": 0.9104255239944905,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 18800,
        "reward_mean": -0.34882500000000005,
        "reward_max": 0.4740749999999999,
        "reward_min": -1.263375,
        "leartime_s": 0.010654996993253008,
        "sampletime": 0.878331290994538,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 19000,
        "reward_mean": -0.5614750000000002,
        "reward_max": 0.1671187499999998,
        "reward_min": -1.60583125,
        "leartime_s": 0.031909432989778,
        "sampletime": 1.1025358329934534,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 19200,
        "reward_mean": -0.5406249999999998,
        "reward_max": 0.2888875000000001,
        "reward_min": -1.4714499999999995,
        "leartime_s": 0.010087108006700873,
        "sampletime": 0.9228384610032663,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 19400,
        "reward_mean": -0.42062499999999986,
        "reward_max": 0.5560875000000003,
        "reward_min": -1.4467999999999999,
        "leartime_s": 0.0379177599970717,
        "sampletime": 0.7617439260066021,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 19600,
        "reward_mean": -0.41702499999999987,
        "reward_max": 0.54206875,
        "reward_min": -1.4198312499999992,
        "leartime_s": 0.04266383399954066,
        "sampletime": 1.0596101540140808,
        "best_mean": -0.28949999999999987,
        "best_max": 0.5161250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 19800,
        "reward_mean": -0.23537499999999978,
        "reward_max": 0.5310125000000002,
        "reward_min": -1.5215437499999998,
        "leartime_s": 0.008805771998595446,
        "sampletime": 0.7717898870178033,
        "best_mean": -0.23537499999999978,
        "best_max": 0.5310125000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 20000,
        "reward_mean": -0.4649249999999998,
        "reward_max": 0.5653125000000001,
        "reward_min": -1.55871875,
        "leartime_s": 0.040159232972655445,
        "sampletime": 0.7962189310055692,
        "best_mean": -0.23537499999999978,
        "best_max": 0.5310125000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 20200,
        "reward_mean": -0.37304999999999977,
        "reward_max": 0.6642437500000002,
        "reward_min": -1.73923125,
        "leartime_s": 0.07753072798368521,
        "sampletime": 0.950765820016386,
        "best_mean": -0.23537499999999978,
        "best_max": 0.5310125000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 20400,
        "reward_mean": -0.2314249999999998,
        "reward_max": 0.6122000000000003,
        "reward_min": -1.5862124999999996,
        "leartime_s": 0.09657106900704093,
        "sampletime": 0.7496423039992806,
        "best_mean": -0.2314249999999998,
        "best_max": 0.6122000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 20600,
        "reward_mean": -0.3673749999999997,
        "reward_max": 0.7496937500000004,
        "reward_min": -1.670662499999999,
        "leartime_s": 0.02571965998504311,
        "sampletime": 0.8178123890247662,
        "best_mean": -0.2314249999999998,
        "best_max": 0.6122000000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 20800,
        "reward_mean": -0.21217499999999964,
        "reward_max": 0.6109875000000002,
        "reward_min": -1.4024999999999999,
        "leartime_s": 0.01848966401303187,
        "sampletime": 0.7552052279934287,
        "best_mean": -0.21217499999999964,
        "best_max": 0.6109875000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 21000,
        "reward_mean": -0.17404999999999984,
        "reward_max": 0.6130875000000001,
        "reward_min": -1.1344874999999994,
        "leartime_s": 0.06185441600973718,
        "sampletime": 1.1407472899882123,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 21200,
        "reward_mean": -0.38437499999999963,
        "reward_max": 0.5452562500000003,
        "reward_min": -1.4995187499999993,
        "leartime_s": 0.06363370001781732,
        "sampletime": 0.8453503729833756,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 21400,
        "reward_mean": -0.3376749999999997,
        "reward_max": 0.6850187500000001,
        "reward_min": -1.3685874999999994,
        "leartime_s": 0.0662174700119067,
        "sampletime": 0.7139501819910947,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 21600,
        "reward_mean": -0.31714999999999977,
        "reward_max": 0.4007312500000002,
        "reward_min": -1.4018062500000001,
        "leartime_s": 0.07693059300072491,
        "sampletime": 0.8367547869856935,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 21800,
        "reward_mean": -0.2981999999999997,
        "reward_max": 0.5479062500000005,
        "reward_min": -2.2345375,
        "leartime_s": 0.09914668998681009,
        "sampletime": 1.0627498289977666,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 22000,
        "reward_mean": -0.42274999999999985,
        "reward_max": 0.4543562500000003,
        "reward_min": -1.6831875,
        "leartime_s": 0.07408411099459045,
        "sampletime": 0.9731587969872635,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 22200,
        "reward_mean": -0.4644999999999998,
        "reward_max": 0.47238749999999996,
        "reward_min": -1.6256249999999999,
        "leartime_s": 0.028880205005407333,
        "sampletime": 0.8275852749939077,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 22400,
        "reward_mean": -0.3779999999999999,
        "reward_max": 0.5281625000000003,
        "reward_min": -1.6785499999999995,
        "leartime_s": 0.03478174499468878,
        "sampletime": 0.9569230759807397,
        "best_mean": -0.17404999999999984,
        "best_max": 0.6130875000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 22600,
        "reward_mean": -0.1717499999999997,
        "reward_max": 0.8615937500000005,
        "reward_min": -1.3214687499999997,
        "leartime_s": 0.050680999003816396,
        "sampletime": 0.894861292996211,
        "best_mean": -0.1717499999999997,
        "best_max": 0.8615937500000005,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 22800,
        "reward_mean": -0.023024999999999893,
        "reward_max": 0.8506125,
        "reward_min": -1.351718749999999,
        "leartime_s": 0.03414108598371968,
        "sampletime": 0.8313623139983974,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 23000,
        "reward_mean": -0.18884999999999982,
        "reward_max": 0.7500749999999999,
        "reward_min": -1.51875,
        "leartime_s": 0.016628822981147096,
        "sampletime": 0.9012602599977981,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 23200,
        "reward_mean": -0.20367499999999983,
        "reward_max": 0.5653062500000001,
        "reward_min": -1.169575,
        "leartime_s": 0.02441065400489606,
        "sampletime": 0.8503388820099644,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 23400,
        "reward_mean": -0.10647499999999976,
        "reward_max": 0.8005312500000001,
        "reward_min": -1.1901562499999996,
        "leartime_s": 0.025453268986893818,
        "sampletime": 0.7461885370139498,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 23600,
        "reward_mean": -0.18592499999999978,
        "reward_max": 0.6569062500000002,
        "reward_min": -1.289275,
        "leartime_s": 0.02206607098923996,
        "sampletime": 0.8181667619792279,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 23800,
        "reward_mean": -0.3370749999999998,
        "reward_max": 0.6383875000000001,
        "reward_min": -1.7464125,
        "leartime_s": 0.023264810995897278,
        "sampletime": 0.8498421490075998,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 24000,
        "reward_mean": -0.38972499999999993,
        "reward_max": 0.5948062500000002,
        "reward_min": -1.412475,
        "leartime_s": 0.023736639006529003,
        "sampletime": 0.7430681079858914,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 24200,
        "reward_mean": -0.30597499999999983,
        "reward_max": 0.7182937500000002,
        "reward_min": -1.5436125,
        "leartime_s": 0.02766307001002133,
        "sampletime": 0.9251359689806122,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 24400,
        "reward_mean": -0.4689749999999998,
        "reward_max": 0.4606937500000002,
        "reward_min": -1.6563312499999996,
        "leartime_s": 0.020711460994789377,
        "sampletime": 0.9172763680107892,
        "best_mean": -0.023024999999999893,
        "best_max": 0.8506125,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 24600,
        "reward_mean": 0.03240000000000009,
        "reward_max": 1.087,
        "reward_min": -1.1205125,
        "leartime_s": 0.03881587600335479,
        "sampletime": 0.8554833729867823,
        "best_mean": 0.03240000000000009,
        "best_max": 1.087,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 24800,
        "reward_mean": -0.23682499999999987,
        "reward_max": 0.7977687500000001,
        "reward_min": -1.2046749999999997,
        "leartime_s": 0.033481262013083324,
        "sampletime": 0.9184753359877504,
        "best_mean": 0.03240000000000009,
        "best_max": 1.087,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 25000,
        "reward_mean": -0.37507499999999977,
        "reward_max": 0.7474375000000002,
        "reward_min": -1.623675,
        "leartime_s": 0.05440586697659455,
        "sampletime": 0.913604678993579,
        "best_mean": 0.03240000000000009,
        "best_max": 1.087,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 25200,
        "reward_mean": -0.3184249999999998,
        "reward_max": 0.5706625000000001,
        "reward_min": -1.5186437499999998,
        "leartime_s": 0.0797319560078904,
        "sampletime": 0.7949529110046569,
        "best_mean": 0.03240000000000009,
        "best_max": 1.087,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 25400,
        "reward_mean": -0.26402499999999973,
        "reward_max": 0.7037687500000004,
        "reward_min": -1.7335374999999997,
        "leartime_s": 0.045269612019183114,
        "sampletime": 0.8757152839971241,
        "best_mean": 0.03240000000000009,
        "best_max": 1.087,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 25600,
        "reward_mean": 0.05605000000000024,
        "reward_max": 1.01044375,
        "reward_min": -1.1568687499999994,
        "leartime_s": 0.03725163999479264,
        "sampletime": 0.9576551069912966,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 25800,
        "reward_mean": -0.22172499999999998,
        "reward_max": 0.6239437499999999,
        "reward_min": -1.31145,
        "leartime_s": 0.012049033015500754,
        "sampletime": 0.7796867580036633,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 26000,
        "reward_mean": 0.04727500000000001,
        "reward_max": 1.1893562500000001,
        "reward_min": -0.9400374999999999,
        "leartime_s": 0.05537687600008212,
        "sampletime": 0.7370163229934406,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 26200,
        "reward_mean": -0.15654999999999983,
        "reward_max": 0.83239375,
        "reward_min": -1.5419687499999999,
        "leartime_s": 0.031959640997229144,
        "sampletime": 0.9760515799862333,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 26400,
        "reward_mean": -0.25100000000000006,
        "reward_max": 0.7076312499999998,
        "reward_min": -1.3486187500000002,
        "leartime_s": 0.05417366401525214,
        "sampletime": 0.7364957490062807,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 26600,
        "reward_mean": -0.08800000000000002,
        "reward_max": 0.8306999999999999,
        "reward_min": -1.19285,
        "leartime_s": 0.01935914100613445,
        "sampletime": 0.77873623999767,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 26800,
        "reward_mean": -0.10407499999999979,
        "reward_max": 0.8206875000000005,
        "reward_min": -2.18475625,
        "leartime_s": 0.035143838002113625,
        "sampletime": 1.002325823996216,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 27000,
        "reward_mean": -0.3409250000000001,
        "reward_max": 0.63851875,
        "reward_min": -1.7263687500000002,
        "leartime_s": 0.05889929199474864,
        "sampletime": 0.8626749289978761,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 27200,
        "reward_mean": -0.5188999999999997,
        "reward_max": 0.4568125000000001,
        "reward_min": -1.851962499999999,
        "leartime_s": 0.027329921984346583,
        "sampletime": 0.8129051509895362,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 27400,
        "reward_mean": -0.19794999999999996,
        "reward_max": 0.84745625,
        "reward_min": -1.3229750000000002,
        "leartime_s": 0.019839234999381006,
        "sampletime": 0.906490652996581,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 27600,
        "reward_mean": -0.28574999999999995,
        "reward_max": 0.6432312500000001,
        "reward_min": -1.415775,
        "leartime_s": 0.016567198996199295,
        "sampletime": 0.8597940469917376,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 27800,
        "reward_mean": -0.3987250000000001,
        "reward_max": 0.6821562499999999,
        "reward_min": -1.64813125,
        "leartime_s": 0.06464879598934203,
        "sampletime": 0.8426599420199636,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 28000,
        "reward_mean": -0.3446749999999999,
        "reward_max": 0.635325,
        "reward_min": -1.5053062499999998,
        "leartime_s": 0.07746960798976943,
        "sampletime": 0.8290953070099931,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 28200,
        "reward_mean": -0.1541999999999997,
        "reward_max": 0.7042625000000003,
        "reward_min": -1.6080437499999995,
        "leartime_s": 0.03400006899028085,
        "sampletime": 1.149762200016994,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 28400,
        "reward_mean": -0.144675,
        "reward_max": 0.73733125,
        "reward_min": -1.2788000000000004,
        "leartime_s": 0.026074902998516336,
        "sampletime": 0.7401244100183249,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 28600,
        "reward_mean": -0.20652499999999988,
        "reward_max": 0.9514312500000002,
        "reward_min": -1.6067375000000002,
        "leartime_s": 0.016087016003439203,
        "sampletime": 0.785141999978805,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 28800,
        "reward_mean": -0.28772499999999984,
        "reward_max": 0.6973125000000001,
        "reward_min": -1.4977999999999996,
        "leartime_s": 0.02182220999384299,
        "sampletime": 0.9996570229995996,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 29000,
        "reward_mean": -0.43862499999999993,
        "reward_max": 0.5779375,
        "reward_min": -1.40965625,
        "leartime_s": 0.058200838015181944,
        "sampletime": 0.824927203997504,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 29200,
        "reward_mean": -0.08277499999999964,
        "reward_max": 0.8383875000000002,
        "reward_min": -1.4269812499999996,
        "leartime_s": 0.07661206100601703,
        "sampletime": 0.6772448839910794,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 29400,
        "reward_mean": -0.2674749999999999,
        "reward_max": 0.7771750000000003,
        "reward_min": -1.3374062499999997,
        "leartime_s": 0.056824844010407105,
        "sampletime": 0.8850058569805697,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 29600,
        "reward_mean": -0.25969999999999993,
        "reward_max": 0.8169250000000001,
        "reward_min": -1.615175,
        "leartime_s": 0.09895081401919015,
        "sampletime": 1.0517971639928874,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 29800,
        "reward_mean": -0.189575,
        "reward_max": 1.0040625000000003,
        "reward_min": -1.2509812500000004,
        "leartime_s": 0.03087943998980336,
        "sampletime": 0.7260566310142167,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 30000,
        "reward_mean": -0.5356499999999998,
        "reward_max": 0.6687937499999999,
        "reward_min": -1.830681249999999,
        "leartime_s": 0.03163708598003723,
        "sampletime": 0.7721835400152486,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 30200,
        "reward_mean": -0.023074999999999946,
        "reward_max": 1.0446437499999999,
        "reward_min": -1.2134125,
        "leartime_s": 0.024271438014693558,
        "sampletime": 0.928876088000834,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 30400,
        "reward_mean": -0.5576499999999998,
        "reward_max": 0.33386875000000027,
        "reward_min": -1.84195625,
        "leartime_s": 0.027377238002372906,
        "sampletime": 0.8954070729960222,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 30600,
        "reward_mean": -0.34759999999999974,
        "reward_max": 0.5594062500000001,
        "reward_min": -1.7617687499999997,
        "leartime_s": 0.06680477398913354,
        "sampletime": 0.8046152669994626,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 30800,
        "reward_mean": -0.15017499999999964,
        "reward_max": 0.8102125000000004,
        "reward_min": -1.0928687499999998,
        "leartime_s": 0.018735935998847708,
        "sampletime": 0.9286335149954539,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 31000,
        "reward_mean": -0.3094499999999998,
        "reward_max": 0.5978500000000002,
        "reward_min": -1.699425,
        "leartime_s": 0.03525027900468558,
        "sampletime": 0.7480322099872865,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 31200,
        "reward_mean": -0.2422249999999997,
        "reward_max": 0.6669125000000005,
        "reward_min": -1.3065374999999995,
        "leartime_s": 0.020002692006528378,
        "sampletime": 0.6841115449788049,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 31400,
        "reward_mean": -0.523875,
        "reward_max": 0.5774875000000003,
        "reward_min": -1.7985937500000009,
        "leartime_s": 0.04195635300129652,
        "sampletime": 0.8665432260022499,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 31600,
        "reward_mean": -0.5509249999999998,
        "reward_max": 0.5696062500000003,
        "reward_min": -1.6541562500000002,
        "leartime_s": 0.011810871976194903,
        "sampletime": 0.9928246519993991,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 31800,
        "reward_mean": -0.33852499999999974,
        "reward_max": 0.6347187500000001,
        "reward_min": -1.4155749999999998,
        "leartime_s": 0.029289480997249484,
        "sampletime": 0.9092789059795905,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 32000,
        "reward_mean": -0.4059249999999998,
        "reward_max": 0.4387125,
        "reward_min": -1.5001062499999995,
        "leartime_s": 0.03089118900243193,
        "sampletime": 0.8225536170066334,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 32200,
        "reward_mean": -0.3417749999999999,
        "reward_max": 0.6161562500000003,
        "reward_min": -1.916825,
        "leartime_s": 0.026699816982727498,
        "sampletime": 0.9458087130042259,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 32400,
        "reward_mean": -0.20437499999999972,
        "reward_max": 0.8325750000000002,
        "reward_min": -1.2951125,
        "leartime_s": 0.06393412000034004,
        "sampletime": 0.7704041580145713,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 32600,
        "reward_mean": -0.47167499999999984,
        "reward_max": 0.54583125,
        "reward_min": -1.76251875,
        "leartime_s": 0.021961653023026884,
        "sampletime": 0.7960423649928998,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 32800,
        "reward_mean": -0.3425999999999997,
        "reward_max": 0.7120125000000004,
        "reward_min": -1.5948624999999996,
        "leartime_s": 0.036608624010114,
        "sampletime": 1.0335541869862936,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 33000,
        "reward_mean": -0.541775,
        "reward_max": 0.3004625000000001,
        "reward_min": -1.8101937500000003,
        "leartime_s": 0.03614897499210201,
        "sampletime": 0.8873476200096775,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 33200,
        "reward_mean": -0.5140999999999998,
        "reward_max": 0.40208125000000017,
        "reward_min": -2.1068124999999998,
        "leartime_s": 0.01388888101791963,
        "sampletime": 0.8057283380185254,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 33400,
        "reward_mean": -0.22849999999999976,
        "reward_max": 0.5720250000000002,
        "reward_min": -1.47731875,
        "leartime_s": 0.06113932799780741,
        "sampletime": 0.9184463680139743,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 33600,
        "reward_mean": -0.4541749999999998,
        "reward_max": 0.3062062500000002,
        "reward_min": -1.77421875,
        "leartime_s": 0.05450569500681013,
        "sampletime": 0.9607689239783213,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 33800,
        "reward_mean": -0.4675249999999997,
        "reward_max": 0.5697625000000003,
        "reward_min": -1.647412499999999,
        "leartime_s": 0.0238362209929619,
        "sampletime": 0.7171105559973512,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 34000,
        "reward_mean": -0.5995749999999999,
        "reward_max": 0.4673562500000001,
        "reward_min": -1.8280500000000002,
        "leartime_s": 0.05094497199752368,
        "sampletime": 0.8765666940016672,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 34200,
        "reward_mean": -0.4775249999999997,
        "reward_max": 0.3320375000000006,
        "reward_min": -1.7303687499999993,
        "leartime_s": 0.037993456004187465,
        "sampletime": 1.0631449990032706,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 34400,
        "reward_mean": -0.6161749999999998,
        "reward_max": 0.3218250000000003,
        "reward_min": -1.7555624999999997,
        "leartime_s": 0.02139112399891019,
        "sampletime": 0.736810577014694,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 34600,
        "reward_mean": -0.4560999999999998,
        "reward_max": 0.4575625000000002,
        "reward_min": -1.7906812499999998,
        "leartime_s": 0.04769134600064717,
        "sampletime": 0.7833196939900517,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 34800,
        "reward_mean": -0.5212249999999999,
        "reward_max": 0.3935312500000001,
        "reward_min": -1.77348125,
        "leartime_s": 0.02328532500541769,
        "sampletime": 0.8729754749801941,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 35000,
        "reward_mean": -0.5939249999999996,
        "reward_max": 0.5515062500000005,
        "reward_min": -2.1176687500000004,
        "leartime_s": 0.0338640850095544,
        "sampletime": 0.7918535619974136,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 35200,
        "reward_mean": -0.6082999999999997,
        "reward_max": 0.5739000000000003,
        "reward_min": -1.7935187500000003,
        "leartime_s": 0.07309791498119012,
        "sampletime": 0.7385608359763864,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 35400,
        "reward_mean": -0.5382499999999998,
        "reward_max": 0.32230000000000014,
        "reward_min": -1.9255874999999996,
        "leartime_s": 0.05535576300462708,
        "sampletime": 0.8670803960121702,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 35600,
        "reward_mean": -0.47682499999999983,
        "reward_max": 0.3111750000000001,
        "reward_min": -1.6253625,
        "leartime_s": 0.0800158669881057,
        "sampletime": 0.7474054579797667,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 35800,
        "reward_mean": -0.4520499999999996,
        "reward_max": 0.6211312500000005,
        "reward_min": -1.5110312499999994,
        "leartime_s": 0.024483845016220585,
        "sampletime": 0.7767042820050847,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 36000,
        "reward_mean": -0.3259749999999998,
        "reward_max": 0.7189812500000002,
        "reward_min": -1.5137249999999998,
        "leartime_s": 0.06565358201623894,
        "sampletime": 0.9478018719819374,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 36200,
        "reward_mean": -0.7550749999999998,
        "reward_max": 0.39297500000000013,
        "reward_min": -1.8845937499999994,
        "leartime_s": 0.015991652995580807,
        "sampletime": 0.9618084109970368,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 36400,
        "reward_mean": -0.32642499999999985,
        "reward_max": 0.52695,
        "reward_min": -1.4181312500000003,
        "leartime_s": 0.05628651598817669,
        "sampletime": 0.8783536569972057,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 36600,
        "reward_mean": -0.71145,
        "reward_max": 0.14529999999999996,
        "reward_min": -1.93145,
        "leartime_s": 0.029713758995058015,
        "sampletime": 0.9938842790143099,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 36800,
        "reward_mean": -0.4634749999999999,
        "reward_max": 0.34864375,
        "reward_min": -1.6985062499999999,
        "leartime_s": 0.044294398016063496,
        "sampletime": 1.1046116200159304,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 37000,
        "reward_mean": -0.6272250000000001,
        "reward_max": 0.24008125000000002,
        "reward_min": -2.004775,
        "leartime_s": 0.048721713974373415,
        "sampletime": 0.8728091730154119,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 37200,
        "reward_mean": -0.31332499999999985,
        "reward_max": 0.61621875,
        "reward_min": -1.5689375,
        "leartime_s": 0.046677598991664127,
        "sampletime": 0.8547739899950102,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 37400,
        "reward_mean": -0.5510999999999999,
        "reward_max": 0.4138750000000002,
        "reward_min": -1.5353562499999998,
        "leartime_s": 0.020715900987852365,
        "sampletime": 1.0663553419872187,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 37600,
        "reward_mean": -0.6881999999999998,
        "reward_max": 0.16210000000000016,
        "reward_min": -2.1060375,
        "leartime_s": 0.05039894601213746,
        "sampletime": 0.9123782370006666,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 37800,
        "reward_mean": -0.5599999999999996,
        "reward_max": 0.3684750000000003,
        "reward_min": -2.0613749999999995,
        "leartime_s": 0.030861903011100367,
        "sampletime": 0.828963270992972,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 38000,
        "reward_mean": -0.6058749999999997,
        "reward_max": 0.39809375,
        "reward_min": -1.9007499999999995,
        "leartime_s": 0.03875757602509111,
        "sampletime": 0.7393002370081376,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 38200,
        "reward_mean": -0.659225,
        "reward_max": 0.37740625000000005,
        "reward_min": -1.926287499999999,
        "leartime_s": 0.04779828799655661,
        "sampletime": 0.7290598849940579,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 38400,
        "reward_mean": -0.6765249999999998,
        "reward_max": 0.3495187500000002,
        "reward_min": -2.1390125,
        "leartime_s": 0.04348328500054777,
        "sampletime": 0.8094437280087732,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 38600,
        "reward_mean": -0.48347499999999977,
        "reward_max": 0.3392312500000003,
        "reward_min": -1.608649999999999,
        "leartime_s": 0.06496245501330122,
        "sampletime": 0.9094085580145475,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 38800,
        "reward_mean": -0.7546249999999999,
        "reward_max": 0.3272937500000002,
        "reward_min": -2.0800625,
        "leartime_s": 0.11417913500918075,
        "sampletime": 0.9477448420075234,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 39000,
        "reward_mean": -0.4991249999999999,
        "reward_max": 0.4085750000000001,
        "reward_min": -1.7163749999999993,
        "leartime_s": 0.06875762500567362,
        "sampletime": 0.7845017430081498,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 39200,
        "reward_mean": -0.41757499999999975,
        "reward_max": 0.5920937500000001,
        "reward_min": -1.2528437499999994,
        "leartime_s": 0.06529182801023126,
        "sampletime": 0.8465662749949843,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 39400,
        "reward_mean": -0.7261749999999999,
        "reward_max": 0.22423125000000008,
        "reward_min": -2.619331249999999,
        "leartime_s": 0.074774722015718,
        "sampletime": 0.8804479499813169,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 39600,
        "reward_mean": -0.5668499999999997,
        "reward_max": 0.36131250000000015,
        "reward_min": -1.7359312499999993,
        "leartime_s": 0.03605247399536893,
        "sampletime": 0.843894049001392,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 39800,
        "reward_mean": -0.603875,
        "reward_max": 0.22510625,
        "reward_min": -1.6067249999999995,
        "leartime_s": 0.02676767998491414,
        "sampletime": 0.8925395940023009,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 40000,
        "reward_mean": -0.4619499999999999,
        "reward_max": 0.31107499999999993,
        "reward_min": -1.594975,
        "leartime_s": 0.04094910100684501,
        "sampletime": 0.8712099310068879,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 40200,
        "reward_mean": -0.6522749999999996,
        "reward_max": 0.31461875000000017,
        "reward_min": -1.8145249999999993,
        "leartime_s": 0.05394588102353737,
        "sampletime": 0.9131440829951316,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 40400,
        "reward_mean": -0.6219749999999997,
        "reward_max": 0.20510000000000037,
        "reward_min": -1.9276249999999993,
        "leartime_s": 0.023192195018054917,
        "sampletime": 0.9775120809790678,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 40600,
        "reward_mean": -0.40652499999999975,
        "reward_max": 0.40190625000000013,
        "reward_min": -1.65639375,
        "leartime_s": 0.07394048100104555,
        "sampletime": 0.8776268219808117,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 40800,
        "reward_mean": -0.530075,
        "reward_max": 0.14325000000000013,
        "reward_min": -1.7291625,
        "leartime_s": 0.0820448370068334,
        "sampletime": 0.8013708149956074,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 41000,
        "reward_mean": -0.544225,
        "reward_max": 0.28755000000000014,
        "reward_min": -1.4804999999999997,
        "leartime_s": 0.034047359018586576,
        "sampletime": 0.8462227679847274,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 41200,
        "reward_mean": -0.6263,
        "reward_max": 0.3349312499999999,
        "reward_min": -1.6695625,
        "leartime_s": 0.06677548500010744,
        "sampletime": 0.9299472109996714,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 41400,
        "reward_mean": -0.46387499999999987,
        "reward_max": 0.6127562500000002,
        "reward_min": -1.4518312499999997,
        "leartime_s": 0.033036676002666354,
        "sampletime": 0.7876453380158637,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 41600,
        "reward_mean": -0.546925,
        "reward_max": 0.35458125,
        "reward_min": -1.7125875000000002,
        "leartime_s": 0.049607951019424945,
        "sampletime": 0.8113026329956483,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 41800,
        "reward_mean": -0.44562499999999977,
        "reward_max": 0.7541937500000002,
        "reward_min": -1.5550999999999995,
        "leartime_s": 0.06250848199124448,
        "sampletime": 0.8818245849979576,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 42000,
        "reward_mean": -0.518025,
        "reward_max": 0.5325500000000002,
        "reward_min": -1.6449250000000002,
        "leartime_s": 0.055947036016732454,
        "sampletime": 0.8020315110043157,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 42200,
        "reward_mean": -0.43915,
        "reward_max": 0.47379999999999994,
        "reward_min": -1.669625,
        "leartime_s": 0.05417525800294243,
        "sampletime": 0.8041108780016657,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 42400,
        "reward_mean": -0.7300749999999999,
        "reward_max": 0.25673125000000024,
        "reward_min": -2.1620624999999998,
        "leartime_s": 0.059960765996947885,
        "sampletime": 0.9086678620078601,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 42600,
        "reward_mean": -0.7940749999999999,
        "reward_max": 0.19556875000000012,
        "reward_min": -2.12369375,
        "leartime_s": 0.052419909014133736,
        "sampletime": 0.8615989480167627,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 42800,
        "reward_mean": -0.938625,
        "reward_max": 0.17713125,
        "reward_min": -2.3266250000000004,
        "leartime_s": 0.03573724097805098,
        "sampletime": 0.7068556220037863,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 43000,
        "reward_mean": -0.8220249999999999,
        "reward_max": 0.43328750000000027,
        "reward_min": -2.5686874999999993,
        "leartime_s": 0.049297491990728304,
        "sampletime": 1.0078640340070706,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 43200,
        "reward_mean": -0.7181249999999998,
        "reward_max": 0.45359375000000013,
        "reward_min": -1.8216312499999998,
        "leartime_s": 0.0756002289999742,
        "sampletime": 0.8529396379890386,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 43400,
        "reward_mean": -0.5748249999999999,
        "reward_max": 0.3238437499999999,
        "reward_min": -1.8571437499999999,
        "leartime_s": 0.02044080098858103,
        "sampletime": 0.8977108540129848,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 43600,
        "reward_mean": -0.7383999999999997,
        "reward_max": 0.12676250000000008,
        "reward_min": -1.8925749999999997,
        "leartime_s": 0.058331982989329845,
        "sampletime": 1.0408258289971855,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 43800,
        "reward_mean": -0.9024749999999999,
        "reward_max": 0.22377500000000008,
        "reward_min": -2.5750124999999993,
        "leartime_s": 0.040002391004236415,
        "sampletime": 0.821802516002208,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 44000,
        "reward_mean": -0.4997249999999998,
        "reward_max": 0.4504062500000001,
        "reward_min": -1.7414124999999996,
        "leartime_s": 0.021712910995120183,
        "sampletime": 0.7745803380094003,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 44200,
        "reward_mean": -0.5425499999999999,
        "reward_max": 0.2787625,
        "reward_min": -1.5270812499999997,
        "leartime_s": 0.013486773008480668,
        "sampletime": 0.9499768390087411,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 44400,
        "reward_mean": -0.9186,
        "reward_max": -0.16493750000000032,
        "reward_min": -2.47799375,
        "leartime_s": 0.05684325500624254,
        "sampletime": 0.9083082019933499,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 44600,
        "reward_mean": -0.8532749999999999,
        "reward_max": 0.19658125000000004,
        "reward_min": -2.0604124999999995,
        "leartime_s": 0.03030898599536158,
        "sampletime": 0.8054926740005612,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 44800,
        "reward_mean": -0.7310249999999998,
        "reward_max": 0.26286250000000017,
        "reward_min": -2.66795625,
        "leartime_s": 0.055385018000379205,
        "sampletime": 0.7878528309811372,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 45000,
        "reward_mean": -0.917075,
        "reward_max": 0.15415625000000016,
        "reward_min": -2.05236875,
        "leartime_s": 0.074520758993458,
        "sampletime": 0.6665709190128837,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 45200,
        "reward_mean": -0.6718500000000002,
        "reward_max": 0.015968749999999962,
        "reward_min": -1.7357749999999998,
        "leartime_s": 0.06708220302243717,
        "sampletime": 0.7216051750001498,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 45400,
        "reward_mean": -0.95045,
        "reward_max": -0.10006875000000029,
        "reward_min": -2.1717437500000005,
        "leartime_s": 0.02296076001948677,
        "sampletime": 0.9004754560010042,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 45600,
        "reward_mean": -0.7333999999999998,
        "reward_max": 0.1581125,
        "reward_min": -1.7354562499999995,
        "leartime_s": 0.034536140999989584,
        "sampletime": 1.0222827140241861,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 45800,
        "reward_mean": -0.6877999999999999,
        "reward_max": 0.21767500000000017,
        "reward_min": -1.9276937500000002,
        "leartime_s": 0.02929178098565899,
        "sampletime": 0.8995678000210319,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 46000,
        "reward_mean": -0.8335999999999999,
        "reward_max": -0.09225625000000014,
        "reward_min": -1.8508687499999996,
        "leartime_s": 0.02065362298162654,
        "sampletime": 0.8098036029841751,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 46200,
        "reward_mean": -0.6650250000000001,
        "reward_max": 0.38241875000000003,
        "reward_min": -1.934225,
        "leartime_s": 0.029938088991912082,
        "sampletime": 1.1436708779947367,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 46400,
        "reward_mean": -0.7245499999999999,
        "reward_max": 0.1778625,
        "reward_min": -2.4187124999999994,
        "leartime_s": 0.05771468300372362,
        "sampletime": 0.8978728000074625,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 46600,
        "reward_mean": -0.53565,
        "reward_max": 0.5677625,
        "reward_min": -1.70529375,
        "leartime_s": 0.0230191640148405,
        "sampletime": 0.7496302719810046,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 46800,
        "reward_mean": -0.5148499999999999,
        "reward_max": 0.3948500000000002,
        "reward_min": -1.56376875,
        "leartime_s": 0.03156536098686047,
        "sampletime": 0.916890605003573,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 47000,
        "reward_mean": -0.8047,
        "reward_max": 0.279625,
        "reward_min": -2.02431875,
        "leartime_s": 0.043725027004256845,
        "sampletime": 1.0038007570256013,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 47200,
        "reward_mean": -0.5937499999999998,
        "reward_max": 0.3173625000000001,
        "reward_min": -1.870625,
        "leartime_s": 0.060053683002479374,
        "sampletime": 0.7723480260174256,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 47400,
        "reward_mean": -0.6290999999999999,
        "reward_max": 0.20661250000000017,
        "reward_min": -1.9369000000000003,
        "leartime_s": 0.04212016999372281,
        "sampletime": 0.8068146479781717,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 47600,
        "reward_mean": -0.5857999999999998,
        "reward_max": 0.40065000000000034,
        "reward_min": -1.85625,
        "leartime_s": 0.04372443800093606,
        "sampletime": 0.8674071739951614,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 47800,
        "reward_mean": -0.6803500000000001,
        "reward_max": 0.19053124999999993,
        "reward_min": -1.9916500000000001,
        "leartime_s": 0.0452603489975445,
        "sampletime": 0.9879683689796366,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 48000,
        "reward_mean": -0.85935,
        "reward_max": 0.13048750000000015,
        "reward_min": -2.2230437500000004,
        "leartime_s": 0.0749883140088059,
        "sampletime": 0.7309079259866849,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 48200,
        "reward_mean": -0.8859750000000002,
        "reward_max": -0.07016250000000031,
        "reward_min": -1.9474750000000003,
        "leartime_s": 0.06310687598306686,
        "sampletime": 0.794218999973964,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 48400,
        "reward_mean": -0.706425,
        "reward_max": 0.2644,
        "reward_min": -1.9110812500000003,
        "leartime_s": 0.04141838400391862,
        "sampletime": 0.960294068994699,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 48600,
        "reward_mean": -0.7518749999999997,
        "reward_max": 0.20681250000000012,
        "reward_min": -1.7903374999999997,
        "leartime_s": 0.02217957700486295,
        "sampletime": 0.856121268006973,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 48800,
        "reward_mean": -0.6640000000000003,
        "reward_max": 0.21683124999999984,
        "reward_min": -1.7262500000000003,
        "leartime_s": 0.036821404995862395,
        "sampletime": 0.941230793017894,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 49000,
        "reward_mean": -0.4905999999999998,
        "reward_max": 0.4627500000000001,
        "reward_min": -2.1433249999999995,
        "leartime_s": 0.03697265399387106,
        "sampletime": 0.8876510350091849,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 49200,
        "reward_mean": -0.7212499999999997,
        "reward_max": 0.28710000000000024,
        "reward_min": -1.9468999999999994,
        "leartime_s": 0.056558513024356216,
        "sampletime": 0.8572435120004229,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 49400,
        "reward_mean": -0.5039250000000001,
        "reward_max": 0.4602187499999998,
        "reward_min": -1.6162187499999998,
        "leartime_s": 0.036356884986162186,
        "sampletime": 0.9783422519976739,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 49600,
        "reward_mean": -0.9330499999999998,
        "reward_max": 0.08005625000000006,
        "reward_min": -2.1104624999999997,
        "leartime_s": 0.047074032976524904,
        "sampletime": 0.7710926439904142,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 49800,
        "reward_mean": -0.5407499999999997,
        "reward_max": 0.4636125000000002,
        "reward_min": -1.7806874999999998,
        "leartime_s": 0.02954836600110866,
        "sampletime": 0.7679557389928959,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 50000,
        "reward_mean": -0.6046749999999999,
        "reward_max": 0.27785625,
        "reward_min": -1.8298937499999992,
        "leartime_s": 0.019948981003835797,
        "sampletime": 0.9803018739912659,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 50200,
        "reward_mean": -0.4366249999999999,
        "reward_max": 0.5844750000000002,
        "reward_min": -1.7834875000000001,
        "leartime_s": 0.04451656501623802,
        "sampletime": 0.8245120889914688,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 50400,
        "reward_mean": -0.5700999999999998,
        "reward_max": 0.35840625000000015,
        "reward_min": -2.1498249999999994,
        "leartime_s": 0.014286977995652705,
        "sampletime": 0.7409245900053065,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 50600,
        "reward_mean": -0.8640749999999998,
        "reward_max": 0.135175,
        "reward_min": -2.4472499999999986,
        "leartime_s": 0.02110511701903306,
        "sampletime": 0.8635996429948136,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 50800,
        "reward_mean": -0.8398249999999997,
        "reward_max": 0.3214375000000001,
        "reward_min": -2.3765749999999994,
        "leartime_s": 0.038727528997696936,
        "sampletime": 1.0592439879837912,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 51000,
        "reward_mean": -0.5718,
        "reward_max": 0.23977500000000007,
        "reward_min": -2.0102249999999997,
        "leartime_s": 0.04947296099271625,
        "sampletime": 0.8304687160125468,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 51200,
        "reward_mean": -0.84005,
        "reward_max": 0.09698750000000014,
        "reward_min": -1.8817125000000003,
        "leartime_s": 0.0252699610136915,
        "sampletime": 0.8268161739979405,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 51400,
        "reward_mean": -0.7937749999999997,
        "reward_max": 0.43291875000000013,
        "reward_min": -1.7133249999999995,
        "leartime_s": 0.06007584001054056,
        "sampletime": 1.0061845379823353,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 51600,
        "reward_mean": -0.8601999999999999,
        "reward_max": 0.32461249999999997,
        "reward_min": -2.1780249999999994,
        "leartime_s": 0.04251924098934978,
        "sampletime": 1.0365730729827192,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 51800,
        "reward_mean": -0.8906249999999999,
        "reward_max": 0.06365625000000003,
        "reward_min": -2.1878249999999997,
        "leartime_s": 0.037464851018739864,
        "sampletime": 0.8091883290035184,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 52000,
        "reward_mean": -0.73505,
        "reward_max": 0.47896250000000024,
        "reward_min": -1.6585624999999997,
        "leartime_s": 0.059942029998637736,
        "sampletime": 0.8126569779997226,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 52200,
        "reward_mean": -0.5388749999999998,
        "reward_max": 0.4514500000000001,
        "reward_min": -1.7395499999999997,
        "leartime_s": 0.0324521709990222,
        "sampletime": 0.7928895959921647,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 52400,
        "reward_mean": -0.595725,
        "reward_max": 0.44546250000000015,
        "reward_min": -1.563575,
        "leartime_s": 0.02934551000362262,
        "sampletime": 0.7698679330060259,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 52600,
        "reward_mean": -0.5235749999999998,
        "reward_max": 0.39101250000000004,
        "reward_min": -1.6666,
        "leartime_s": 0.02722460200311616,
        "sampletime": 0.8578566600044724,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 52800,
        "reward_mean": -0.39224999999999977,
        "reward_max": 0.7103437500000004,
        "reward_min": -1.7694499999999997,
        "leartime_s": 0.028164852992631495,
        "sampletime": 1.1026910299842712,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 53000,
        "reward_mean": -0.5918249999999999,
        "reward_max": 0.5950625000000002,
        "reward_min": -1.9026625,
        "leartime_s": 0.07744004798587412,
        "sampletime": 0.8226756090007257,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 53200,
        "reward_mean": -0.6714249999999999,
        "reward_max": 0.37849374999999996,
        "reward_min": -2.0003375,
        "leartime_s": 0.034218932007206604,
        "sampletime": 0.753611997992266,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 53400,
        "reward_mean": -0.7299749999999999,
        "reward_max": 0.15288750000000012,
        "reward_min": -2.3339812499999995,
        "leartime_s": 0.06432435900205746,
        "sampletime": 0.9175442069827113,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 53600,
        "reward_mean": -0.7719749999999999,
        "reward_max": 0.07713125000000005,
        "reward_min": -1.9133875000000005,
        "leartime_s": 0.031942925008479506,
        "sampletime": 0.9693128960207105,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 53800,
        "reward_mean": -0.52825,
        "reward_max": 0.4891499999999999,
        "reward_min": -2.02005625,
        "leartime_s": 0.024524392996681854,
        "sampletime": 0.8127543270238675,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 54000,
        "reward_mean": -0.6442499999999999,
        "reward_max": 0.2145750000000001,
        "reward_min": -1.8231875,
        "leartime_s": 0.03656190598849207,
        "sampletime": 1.0400167499901727,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 54200,
        "reward_mean": -0.531575,
        "reward_max": 0.3309500000000001,
        "reward_min": -1.5294062499999996,
        "leartime_s": 0.04226165701402351,
        "sampletime": 0.7935543330095243,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 54400,
        "reward_mean": -0.6667249999999999,
        "reward_max": 0.34270625,
        "reward_min": -1.8355249999999994,
        "leartime_s": 0.042913048004265875,
        "sampletime": 0.74501715801307,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 54600,
        "reward_mean": -0.6114749999999999,
        "reward_max": 0.20869375000000023,
        "reward_min": -1.9270874999999998,
        "leartime_s": 0.07363491700380109,
        "sampletime": 0.8960194970131852,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 54800,
        "reward_mean": -0.844725,
        "reward_max": -0.03249375000000004,
        "reward_min": -1.8543249999999998,
        "leartime_s": 0.025107296998612583,
        "sampletime": 0.9873644379840698,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 55000,
        "reward_mean": -0.36954999999999993,
        "reward_max": 0.55559375,
        "reward_min": -1.4032250000000004,
        "leartime_s": 0.07396020600572228,
        "sampletime": 0.7930752789834514,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 55200,
        "reward_mean": -0.6652499999999999,
        "reward_max": 0.24769375000000002,
        "reward_min": -2.12728125,
        "leartime_s": 0.051556794001953676,
        "sampletime": 0.7607289580046199,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 55400,
        "reward_mean": -0.5853999999999998,
        "reward_max": 0.2945437500000002,
        "reward_min": -2.0364812499999996,
        "leartime_s": 0.053333306015701964,
        "sampletime": 1.057361901999684,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 55600,
        "reward_mean": -0.6540499999999999,
        "reward_max": 0.3165000000000003,
        "reward_min": -2.05795,
        "leartime_s": 0.06262754398630932,
        "sampletime": 0.689606569998432,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 55800,
        "reward_mean": -0.4397249999999997,
        "reward_max": 0.5743750000000003,
        "reward_min": -1.8606562500000001,
        "leartime_s": 0.02618626700132154,
        "sampletime": 0.7622305550030433,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 56000,
        "reward_mean": -0.5863999999999998,
        "reward_max": 0.32337500000000013,
        "reward_min": -2.1155749999999993,
        "leartime_s": 0.04597312299301848,
        "sampletime": 0.9010276980116032,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 56200,
        "reward_mean": -0.5876249999999997,
        "reward_max": 0.6388125000000002,
        "reward_min": -1.7910812499999997,
        "leartime_s": 0.020029876002809033,
        "sampletime": 0.9659267750103027,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 56400,
        "reward_mean": -0.5234499999999999,
        "reward_max": 0.5457937500000001,
        "reward_min": -1.5298937499999994,
        "leartime_s": 0.04434804298216477,
        "sampletime": 0.753472418000456,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 56600,
        "reward_mean": -0.8179499999999998,
        "reward_max": 0.2524875000000001,
        "reward_min": -2.06646875,
        "leartime_s": 0.05807278698193841,
        "sampletime": 0.8642230439872947,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 56800,
        "reward_mean": -0.5192249999999997,
        "reward_max": 0.42882500000000007,
        "reward_min": -1.6898062499999993,
        "leartime_s": 0.0354257799917832,
        "sampletime": 1.013557733997004,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 57000,
        "reward_mean": -0.3925999999999999,
        "reward_max": 0.5315500000000001,
        "reward_min": -1.3410687499999996,
        "leartime_s": 0.017645165004068986,
        "sampletime": 0.7915829610137735,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 57200,
        "reward_mean": -0.14229999999999973,
        "reward_max": 1.134225,
        "reward_min": -1.3929874999999996,
        "leartime_s": 0.0768333259911742,
        "sampletime": 0.8416698639921378,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 57400,
        "reward_mean": -0.45599999999999985,
        "reward_max": 0.44233750000000016,
        "reward_min": -1.7996125000000005,
        "leartime_s": 0.056070599996019155,
        "sampletime": 0.9611137599858921,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 57600,
        "reward_mean": -0.28667499999999974,
        "reward_max": 0.6209687500000003,
        "reward_min": -1.3169687499999998,
        "leartime_s": 0.08271888000308536,
        "sampletime": 0.7117270379967522,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 57800,
        "reward_mean": -0.6557249999999997,
        "reward_max": 0.3124187500000002,
        "reward_min": -1.9561562499999996,
        "leartime_s": 0.04464333699434064,
        "sampletime": 0.8845184009987861,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 58000,
        "reward_mean": -0.3549999999999997,
        "reward_max": 0.6954687500000003,
        "reward_min": -1.97901875,
        "leartime_s": 0.0791917220049072,
        "sampletime": 1.0253955679945648,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 58200,
        "reward_mean": -0.43127499999999996,
        "reward_max": 0.42208125000000013,
        "reward_min": -1.523,
        "leartime_s": 0.034924623992992565,
        "sampletime": 0.7384392219828442,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 58400,
        "reward_mean": -0.25745000000000007,
        "reward_max": 0.5857999999999999,
        "reward_min": -1.3592937500000004,
        "leartime_s": 0.030176391010172665,
        "sampletime": 0.7899949720012955,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 58600,
        "reward_mean": -0.5570249999999999,
        "reward_max": 0.3618687500000003,
        "reward_min": -1.8172124999999995,
        "leartime_s": 0.08108548598829657,
        "sampletime": 0.9552173599950038,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 58800,
        "reward_mean": -0.3459499999999998,
        "reward_max": 0.7264187500000003,
        "reward_min": -1.4600250000000004,
        "leartime_s": 0.07842407599673606,
        "sampletime": 1.0498348280088976,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 59000,
        "reward_mean": -0.30949999999999994,
        "reward_max": 0.6679500000000002,
        "reward_min": -1.81745625,
        "leartime_s": 0.027562781993765384,
        "sampletime": 0.768055539985653,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 59200,
        "reward_mean": -0.2988999999999998,
        "reward_max": 0.6242625000000003,
        "reward_min": -1.6122500000000004,
        "leartime_s": 0.05944933800492436,
        "sampletime": 0.7292258309898898,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 59400,
        "reward_mean": -0.1915249999999998,
        "reward_max": 0.6712187500000004,
        "reward_min": -1.2721,
        "leartime_s": 0.03195351400063373,
        "sampletime": 0.7847785239864606,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 59600,
        "reward_mean": -0.1486999999999999,
        "reward_max": 0.6767437500000002,
        "reward_min": -1.5198187499999998,
        "leartime_s": 0.060178999992785975,
        "sampletime": 0.7338922080234624,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 59800,
        "reward_mean": -0.25389999999999996,
        "reward_max": 0.7747687500000002,
        "reward_min": -1.91899375,
        "leartime_s": 0.03938437800388783,
        "sampletime": 0.7852650819986593,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 60000,
        "reward_mean": -0.4366000000000001,
        "reward_max": 0.592775,
        "reward_min": -1.7240000000000004,
        "leartime_s": 0.03469996599596925,
        "sampletime": 0.9268782809958793,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 60200,
        "reward_mean": -0.17884999999999993,
        "reward_max": 0.7985624999999998,
        "reward_min": -1.4540874999999995,
        "leartime_s": 0.05440071600605734,
        "sampletime": 0.7512400500127114,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 60400,
        "reward_mean": -0.39477499999999993,
        "reward_max": 0.47428750000000014,
        "reward_min": -1.3970000000000002,
        "leartime_s": 0.08535107600619085,
        "sampletime": 0.7677178349986207,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 60600,
        "reward_mean": -0.019575000000000002,
        "reward_max": 1.0002499999999999,
        "reward_min": -1.3656562500000005,
        "leartime_s": 0.02863071599858813,
        "sampletime": 0.9711174920084886,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 60800,
        "reward_mean": -0.2740999999999999,
        "reward_max": 0.7807750000000001,
        "reward_min": -1.4175625,
        "leartime_s": 0.034684059995925054,
        "sampletime": 1.0783144879969768,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 61000,
        "reward_mean": -0.357375,
        "reward_max": 0.6240687499999998,
        "reward_min": -2.0067812499999995,
        "leartime_s": 0.022274621995165944,
        "sampletime": 0.8555285820038989,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 61200,
        "reward_mean": -0.38092499999999985,
        "reward_max": 0.45873125000000026,
        "reward_min": -1.4352187499999998,
        "leartime_s": 0.05110351802431978,
        "sampletime": 0.7875507480057422,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 61400,
        "reward_mean": -0.040449999999999944,
        "reward_max": 0.8979124999999999,
        "reward_min": -1.146175,
        "leartime_s": 0.07562626199796796,
        "sampletime": 1.0445859839965124,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 61600,
        "reward_mean": -0.1829999999999998,
        "reward_max": 0.8344000000000003,
        "reward_min": -1.6568750000000003,
        "leartime_s": 0.042569726007059216,
        "sampletime": 0.7389501910074614,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 61800,
        "reward_mean": -0.23309999999999984,
        "reward_max": 0.7324875000000002,
        "reward_min": -1.4525374999999998,
        "leartime_s": 0.043934867018833756,
        "sampletime": 0.8030260009982157,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 62000,
        "reward_mean": -0.4325249999999999,
        "reward_max": 0.58125625,
        "reward_min": -1.49796875,
        "leartime_s": 0.06319678699946962,
        "sampletime": 0.9348323610029183,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 62200,
        "reward_mean": -0.3834250000000001,
        "reward_max": 0.55125,
        "reward_min": -1.9983437499999996,
        "leartime_s": 0.06560092099243775,
        "sampletime": 0.7901537599973381,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 62400,
        "reward_mean": -0.38339999999999996,
        "reward_max": 0.48088125,
        "reward_min": -1.7065437500000002,
        "leartime_s": 0.02845554699888453,
        "sampletime": 0.8969879760115873,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 62600,
        "reward_mean": -0.16732499999999986,
        "reward_max": 0.9020750000000002,
        "reward_min": -1.4102749999999997,
        "leartime_s": 0.03969474500627257,
        "sampletime": 0.9100997550121974,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 62800,
        "reward_mean": -0.27387499999999987,
        "reward_max": 0.8295999999999999,
        "reward_min": -1.5516874999999997,
        "leartime_s": 0.06331117197987624,
        "sampletime": 0.8542419279983733,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 63000,
        "reward_mean": -0.72415,
        "reward_max": 0.29766249999999994,
        "reward_min": -1.8084749999999994,
        "leartime_s": 0.05362148498534225,
        "sampletime": 0.8326412909955252,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 63200,
        "reward_mean": -0.00554999999999984,
        "reward_max": 0.947125,
        "reward_min": -1.3765,
        "leartime_s": 0.08363680099137127,
        "sampletime": 0.8503320129821077,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 63400,
        "reward_mean": -0.58665,
        "reward_max": 0.34611250000000005,
        "reward_min": -1.9601374999999992,
        "leartime_s": 0.08777549900696613,
        "sampletime": 0.9704114499909338,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 63600,
        "reward_mean": -0.49139999999999984,
        "reward_max": 0.4534875000000001,
        "reward_min": -1.6814687499999998,
        "leartime_s": 0.05001247601467185,
        "sampletime": 0.8306708460149821,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 63800,
        "reward_mean": -0.23454999999999973,
        "reward_max": 0.5069000000000004,
        "reward_min": -1.2587374999999996,
        "leartime_s": 0.03204652402200736,
        "sampletime": 0.794781413016608,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 64000,
        "reward_mean": -0.051624999999999845,
        "reward_max": 0.9833874999999996,
        "reward_min": -1.2259374999999997,
        "leartime_s": 0.03905663901241496,
        "sampletime": 0.9517747710051481,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 64200,
        "reward_mean": -0.2563499999999999,
        "reward_max": 0.6248750000000002,
        "reward_min": -1.7891000000000001,
        "leartime_s": 0.08096431900048628,
        "sampletime": 0.7126591809792444,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 64400,
        "reward_mean": -0.42679999999999996,
        "reward_max": 0.484475,
        "reward_min": -1.4526375000000002,
        "leartime_s": 0.06742679901071824,
        "sampletime": 0.7540503960044589,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 64600,
        "reward_mean": -0.11902499999999983,
        "reward_max": 0.8032125000000002,
        "reward_min": -1.2827687499999996,
        "leartime_s": 0.07344268797896802,
        "sampletime": 0.9810416240070481,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 64800,
        "reward_mean": -0.36615000000000003,
        "reward_max": 0.6432687500000001,
        "reward_min": -1.52249375,
        "leartime_s": 0.09456399298505858,
        "sampletime": 1.0271234399988316,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 65000,
        "reward_mean": -0.21192499999999997,
        "reward_max": 0.6060749999999999,
        "reward_min": -2.0816187499999996,
        "leartime_s": 0.04625567400944419,
        "sampletime": 0.777267742989352,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 65200,
        "reward_mean": -0.2746249999999999,
        "reward_max": 0.75096875,
        "reward_min": -1.4614500000000001,
        "leartime_s": 0.04160749100265093,
        "sampletime": 0.8485153660003562,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 65400,
        "reward_mean": -0.27095,
        "reward_max": 0.5911124999999999,
        "reward_min": -1.4727625000000004,
        "leartime_s": 0.08625247998861596,
        "sampletime": 0.8000947840046138,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 65600,
        "reward_mean": -0.17707499999999998,
        "reward_max": 0.7796062499999998,
        "reward_min": -1.5411687500000002,
        "leartime_s": 0.03327797801466659,
        "sampletime": 0.8240549839974847,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 65800,
        "reward_mean": -0.11852499999999999,
        "reward_max": 0.6651812499999997,
        "reward_min": -1.2151875,
        "leartime_s": 0.044450927001889795,
        "sampletime": 0.9723464540147688,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 66000,
        "reward_mean": -0.15209999999999985,
        "reward_max": 0.7567875000000001,
        "reward_min": -1.2628499999999998,
        "leartime_s": 0.06663397699594498,
        "sampletime": 0.8829644490033388,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 66200,
        "reward_mean": -0.28807499999999986,
        "reward_max": 0.7629874999999998,
        "reward_min": -1.4888374999999996,
        "leartime_s": 0.06766163799329661,
        "sampletime": 0.7823185359884519,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 66400,
        "reward_mean": -0.35664999999999986,
        "reward_max": 0.6341000000000002,
        "reward_min": -1.675425,
        "leartime_s": 0.0651568360044621,
        "sampletime": 0.8280483729904518,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 66600,
        "reward_mean": -0.176,
        "reward_max": 0.7702624999999999,
        "reward_min": -1.65338125,
        "leartime_s": 0.04417976099648513,
        "sampletime": 0.8108972839836497,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 66800,
        "reward_mean": -0.4441499999999999,
        "reward_max": 0.47523125,
        "reward_min": -1.498175,
        "leartime_s": 0.04722296301042661,
        "sampletime": 0.7432813030027319,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 67000,
        "reward_mean": -0.24409999999999996,
        "reward_max": 0.7673312499999999,
        "reward_min": -1.2895687500000004,
        "leartime_s": 0.07122541300486773,
        "sampletime": 0.8070464190095663,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 67200,
        "reward_mean": -0.17952499999999985,
        "reward_max": 0.8505312500000001,
        "reward_min": -1.5690374999999999,
        "leartime_s": 0.08525650500087067,
        "sampletime": 1.023566842020955,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 67400,
        "reward_mean": -0.3214499999999998,
        "reward_max": 0.48792500000000005,
        "reward_min": -1.5651499999999996,
        "leartime_s": 0.10465317699708976,
        "sampletime": 0.908640479989117,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 67600,
        "reward_mean": -0.2574999999999999,
        "reward_max": 0.654,
        "reward_min": -1.6224,
        "leartime_s": 0.08725383001728915,
        "sampletime": 0.7154432609968353,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 67800,
        "reward_mean": -0.321625,
        "reward_max": 0.7111250000000001,
        "reward_min": -1.6590937500000003,
        "leartime_s": 0.02706106600817293,
        "sampletime": 0.8227553570177406,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 68000,
        "reward_mean": -0.4539999999999998,
        "reward_max": 0.3975437500000002,
        "reward_min": -1.4445312499999996,
        "leartime_s": 0.05293643899494782,
        "sampletime": 0.9626435480022337,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 68200,
        "reward_mean": -0.06527500000000003,
        "reward_max": 0.8306687499999997,
        "reward_min": -1.2622562499999999,
        "leartime_s": 0.061433761002263054,
        "sampletime": 0.8026813250035048,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 68400,
        "reward_mean": -0.2255999999999999,
        "reward_max": 0.5995812500000002,
        "reward_min": -1.2278624999999996,
        "leartime_s": 0.0526536209799815,
        "sampletime": 0.7969932699925266,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 68600,
        "reward_mean": -0.19507499999999997,
        "reward_max": 0.82106875,
        "reward_min": -1.2605875,
        "leartime_s": 0.09601611300604418,
        "sampletime": 1.051477558008628,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 68800,
        "reward_mean": -0.32997499999999996,
        "reward_max": 0.65068125,
        "reward_min": -1.669893749999999,
        "leartime_s": 0.05801157600944862,
        "sampletime": 0.8997278379974887,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 69000,
        "reward_mean": -0.17634999999999998,
        "reward_max": 0.8167562500000003,
        "reward_min": -1.17531875,
        "leartime_s": 0.038059649989008904,
        "sampletime": 0.8821487109817099,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 69200,
        "reward_mean": -0.06757500000000011,
        "reward_max": 0.7844312499999997,
        "reward_min": -1.3874062500000004,
        "leartime_s": 0.03132564201951027,
        "sampletime": 0.7681940640031826,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 69400,
        "reward_mean": -0.17034999999999995,
        "reward_max": 0.9619125000000004,
        "reward_min": -1.23889375,
        "leartime_s": 0.06404547599959187,
        "sampletime": 1.0911661610007286,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 69600,
        "reward_mean": -0.1773749999999998,
        "reward_max": 0.9203125000000003,
        "reward_min": -1.5432624999999998,
        "leartime_s": 0.07224917600979097,
        "sampletime": 0.8673666639951989,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 69800,
        "reward_mean": -0.2595999999999998,
        "reward_max": 0.6684125000000001,
        "reward_min": -1.4364749999999997,
        "leartime_s": 0.02849277897621505,
        "sampletime": 0.7323587230057456,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 70000,
        "reward_mean": -0.14072499999999985,
        "reward_max": 0.83144375,
        "reward_min": -1.2213687499999994,
        "leartime_s": 0.055954479990759864,
        "sampletime": 0.7714828989992384,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 70200,
        "reward_mean": -0.03399999999999989,
        "reward_max": 0.8469375,
        "reward_min": -1.01375,
        "leartime_s": 0.06329254599404521,
        "sampletime": 0.9552147840149701,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 70400,
        "reward_mean": -0.1555749999999999,
        "reward_max": 0.8165562500000001,
        "reward_min": -1.2956062500000003,
        "leartime_s": 0.07114288400043733,
        "sampletime": 0.7797589160036296,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 70600,
        "reward_mean": -0.05974999999999987,
        "reward_max": 0.8582500000000002,
        "reward_min": -1.58464375,
        "leartime_s": 0.06478402198990807,
        "sampletime": 0.8347736999858171,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 70800,
        "reward_mean": -0.12430000000000005,
        "reward_max": 0.8105874999999998,
        "reward_min": -1.4515249999999997,
        "leartime_s": 0.10599387501133606,
        "sampletime": 1.0491497470065951,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 71000,
        "reward_mean": -0.1643250000000001,
        "reward_max": 0.7064249999999995,
        "reward_min": -1.1541562499999998,
        "leartime_s": 0.04541987198172137,
        "sampletime": 0.8110554250015412,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 71200,
        "reward_mean": -0.24810000000000001,
        "reward_max": 0.5451125000000001,
        "reward_min": -1.4002874999999997,
        "leartime_s": 0.05776793300174177,
        "sampletime": 0.8360172320099082,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 71400,
        "reward_mean": -0.06112499999999984,
        "reward_max": 0.8361875000000001,
        "reward_min": -1.4250812499999996,
        "leartime_s": 0.03204301299410872,
        "sampletime": 0.8570990459993482,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 71600,
        "reward_mean": -0.22565000000000004,
        "reward_max": 0.9413374999999999,
        "reward_min": -1.5306249999999997,
        "leartime_s": 0.059155755006941035,
        "sampletime": 1.0311729300010484,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 71800,
        "reward_mean": -0.0997999999999999,
        "reward_max": 0.8735125,
        "reward_min": -1.1384999999999998,
        "leartime_s": 0.02458119799848646,
        "sampletime": 0.8292247710051015,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 72000,
        "reward_mean": -0.19402499999999995,
        "reward_max": 0.7259750000000003,
        "reward_min": -1.7990312500000003,
        "leartime_s": 0.04901453299680725,
        "sampletime": 0.8102697180001996,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 72200,
        "reward_mean": -0.04772499999999996,
        "reward_max": 0.8672749999999999,
        "reward_min": -1.1218937499999995,
        "leartime_s": 0.0369694730034098,
        "sampletime": 0.9059285489784088,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 72400,
        "reward_mean": -0.3565000000000001,
        "reward_max": 0.9330999999999995,
        "reward_min": -1.579475,
        "leartime_s": 0.07530813800985925,
        "sampletime": 0.8202880969911348,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 72600,
        "reward_mean": -0.2890749999999999,
        "reward_max": 0.6859812500000001,
        "reward_min": -1.5644437500000001,
        "leartime_s": 0.024283488019136712,
        "sampletime": 0.8002212149731349,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 72800,
        "reward_mean": -0.25735,
        "reward_max": 0.7029874999999999,
        "reward_min": -1.9319249999999997,
        "leartime_s": 0.02555159298935905,
        "sampletime": 0.9015643750026356,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 73000,
        "reward_mean": -0.12719999999999998,
        "reward_max": 0.7404999999999999,
        "reward_min": -1.2014375000000004,
        "leartime_s": 0.06480782601283863,
        "sampletime": 0.8404156430042349,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 73200,
        "reward_mean": -0.36404999999999993,
        "reward_max": 0.5398187500000001,
        "reward_min": -1.7085375000000003,
        "leartime_s": 0.021097054006531835,
        "sampletime": 0.7748024010215886,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 73400,
        "reward_mean": -0.23442500000000008,
        "reward_max": 0.5788249999999999,
        "reward_min": -1.2909062500000001,
        "leartime_s": 0.0793149069941137,
        "sampletime": 0.9127406250045169,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 73600,
        "reward_mean": -0.332225,
        "reward_max": 0.7307187500000001,
        "reward_min": -1.5906874999999998,
        "leartime_s": 0.06585917100892402,
        "sampletime": 1.0496674870082643,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 73800,
        "reward_mean": -0.13507499999999995,
        "reward_max": 0.7217312499999999,
        "reward_min": -1.90936875,
        "leartime_s": 0.030003324995050207,
        "sampletime": 0.7461093419988174,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 74000,
        "reward_mean": -0.24715000000000006,
        "reward_max": 1.0582749999999996,
        "reward_min": -1.3278999999999999,
        "leartime_s": 0.05993352399673313,
        "sampletime": 0.7326449489919469,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 74200,
        "reward_mean": -0.33894999999999986,
        "reward_max": 0.7721062500000002,
        "reward_min": -1.46120625,
        "leartime_s": 0.023750168998958543,
        "sampletime": 0.732097705011256,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 74400,
        "reward_mean": -0.37860000000000016,
        "reward_max": 0.6670999999999998,
        "reward_min": -1.5329000000000002,
        "leartime_s": 0.024358818016480654,
        "sampletime": 0.7637788919964805,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 74600,
        "reward_mean": -0.24879999999999994,
        "reward_max": 0.63410625,
        "reward_min": -1.3302874999999998,
        "leartime_s": 0.042406794003909454,
        "sampletime": 0.7010710370086599,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 74800,
        "reward_mean": -0.2984250000000001,
        "reward_max": 1.0842562499999997,
        "reward_min": -1.4328625000000004,
        "leartime_s": 0.04617749998578802,
        "sampletime": 0.9650145320047159,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 75000,
        "reward_mean": 0.04634999999999992,
        "reward_max": 1.1599624999999998,
        "reward_min": -1.6498187500000003,
        "leartime_s": 0.02577099099289626,
        "sampletime": 0.9527807699923869,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 75200,
        "reward_mean": -0.45747499999999997,
        "reward_max": 0.6959187500000001,
        "reward_min": -1.46376875,
        "leartime_s": 0.05274481599917635,
        "sampletime": 0.8057388760207687,
        "best_mean": 0.05605000000000024,
        "best_max": 1.01044375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 75400,
        "reward_mean": 0.0764500000000001,
        "reward_max": 0.9600250000000001,
        "reward_min": -1.1523812500000004,
        "leartime_s": 0.053537540981778875,
        "sampletime": 0.7551823740068357,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 75600,
        "reward_mean": -0.07362499999999995,
        "reward_max": 1.2346125,
        "reward_min": -1.26144375,
        "leartime_s": 0.08280072099296376,
        "sampletime": 0.9814164030249231,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 75800,
        "reward_mean": -0.1349249999999999,
        "reward_max": 0.7598562499999999,
        "reward_min": -1.1808812500000003,
        "leartime_s": 0.0758480119984597,
        "sampletime": 0.8675462489773054,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 76000,
        "reward_mean": -0.27587499999999987,
        "reward_max": 0.8344500000000002,
        "reward_min": -1.7427624999999998,
        "leartime_s": 0.047951335000107065,
        "sampletime": 0.7657924210070632,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 76200,
        "reward_mean": -0.3035249999999999,
        "reward_max": 0.7745812500000001,
        "reward_min": -2.1654875,
        "leartime_s": 0.07501624102587812,
        "sampletime": 0.9797470839985181,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 76400,
        "reward_mean": -0.20692499999999986,
        "reward_max": 0.64925625,
        "reward_min": -1.7308812499999993,
        "leartime_s": 0.04070736200083047,
        "sampletime": 0.8929571440094151,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 76600,
        "reward_mean": 0.06490000000000029,
        "reward_max": 1.3258187500000003,
        "reward_min": -0.9968749999999995,
        "leartime_s": 0.038985544990282506,
        "sampletime": 0.8469306449987926,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 76800,
        "reward_mean": -0.267275,
        "reward_max": 0.7786875000000002,
        "reward_min": -1.7307500000000005,
        "leartime_s": 0.06834412401076406,
        "sampletime": 0.711421904998133,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 77000,
        "reward_mean": 0.05809999999999998,
        "reward_max": 1.2846374999999999,
        "reward_min": -0.9681312500000001,
        "leartime_s": 0.07449502500821836,
        "sampletime": 1.198383968003327,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 77200,
        "reward_mean": -0.420875,
        "reward_max": 0.7863687499999996,
        "reward_min": -1.6024562500000006,
        "leartime_s": 0.054633464984362945,
        "sampletime": 0.7867758969950955,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 77400,
        "reward_mean": -0.12562500000000013,
        "reward_max": 0.8132625,
        "reward_min": -1.7415625000000001,
        "leartime_s": 0.0501358020119369,
        "sampletime": 0.7749687480099965,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 77600,
        "reward_mean": -0.3215749999999999,
        "reward_max": 0.7621750000000003,
        "reward_min": -1.5847375,
        "leartime_s": 0.07340522401500493,
        "sampletime": 0.7784212219994515,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 77800,
        "reward_mean": -0.23839999999999992,
        "reward_max": 0.81968125,
        "reward_min": -1.4056374999999999,
        "leartime_s": 0.05188046398689039,
        "sampletime": 1.021872318990063,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 78000,
        "reward_mean": -0.10912499999999999,
        "reward_max": 0.7953,
        "reward_min": -1.5798999999999996,
        "leartime_s": 0.08282679700641893,
        "sampletime": 0.7771135660004802,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 78200,
        "reward_mean": -0.25325,
        "reward_max": 0.7867562499999999,
        "reward_min": -1.7001750000000002,
        "leartime_s": 0.04404946297290735,
        "sampletime": 0.9520313699904364,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 78400,
        "reward_mean": -0.22384999999999997,
        "reward_max": 0.8704999999999999,
        "reward_min": -1.82085,
        "leartime_s": 0.044994322990532964,
        "sampletime": 1.1510588689998258,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 78600,
        "reward_mean": -0.07559999999999982,
        "reward_max": 1.1107500000000001,
        "reward_min": -1.5107999999999997,
        "leartime_s": 0.0553403009835165,
        "sampletime": 0.8088317000074312,
        "best_mean": 0.0764500000000001,
        "best_max": 0.9600250000000001,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 78800,
        "reward_mean": 0.1166750000000001,
        "reward_max": 1.1881000000000002,
        "reward_min": -0.9383749999999998,
        "leartime_s": 0.051674554008059204,
        "sampletime": 0.8865048709849361,
        "best_mean": 0.1166750000000001,
        "best_max": 1.1881000000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 79000,
        "reward_mean": 0.13197500000000015,
        "reward_max": 1.0361625,
        "reward_min": -1.32895625,
        "leartime_s": 0.02350855400436558,
        "sampletime": 1.0130726400238927,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 79200,
        "reward_mean": -0.11332499999999993,
        "reward_max": 0.8384874999999998,
        "reward_min": -1.6249562499999999,
        "leartime_s": 0.08499559800839052,
        "sampletime": 1.0254740840173326,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 79400,
        "reward_mean": -0.24874999999999992,
        "reward_max": 0.7635875,
        "reward_min": -1.4987624999999998,
        "leartime_s": 0.08289250600500964,
        "sampletime": 0.8051144040073268,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 79600,
        "reward_mean": -0.014199999999999826,
        "reward_max": 0.99896875,
        "reward_min": -1.4572250000000002,
        "leartime_s": 0.05358590200194158,
        "sampletime": 0.7157538540195674,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 79800,
        "reward_mean": -0.05644999999999994,
        "reward_max": 0.98865,
        "reward_min": -1.2403625,
        "leartime_s": 0.067477123986464,
        "sampletime": 1.0544864920084365,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 80000,
        "reward_mean": -0.2829749999999998,
        "reward_max": 0.7224875000000001,
        "reward_min": -1.5318874999999998,
        "leartime_s": 0.0683295460185036,
        "sampletime": 1.0815636590123177,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 80200,
        "reward_mean": -0.4695749999999999,
        "reward_max": 0.5142562500000001,
        "reward_min": -1.9116500000000003,
        "leartime_s": 0.05639274598797783,
        "sampletime": 0.8391746210108977,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 80400,
        "reward_mean": -0.235375,
        "reward_max": 0.99679375,
        "reward_min": -1.3570875,
        "leartime_s": 0.04208789297263138,
        "sampletime": 0.7125065300206188,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 80600,
        "reward_mean": -0.38867499999999977,
        "reward_max": 0.8587562500000003,
        "reward_min": -1.4293375,
        "leartime_s": 0.0836343209957704,
        "sampletime": 0.8650810050021391,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 80800,
        "reward_mean": -0.3827749999999999,
        "reward_max": 0.7068125000000001,
        "reward_min": -1.3238625,
        "leartime_s": 0.05699017201550305,
        "sampletime": 1.0254443679878023,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 81000,
        "reward_mean": -0.3651249999999998,
        "reward_max": 0.5012875000000002,
        "reward_min": -1.61551875,
        "leartime_s": 0.06374586801393889,
        "sampletime": 0.7905641539837234,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 81200,
        "reward_mean": -0.2785749999999996,
        "reward_max": 0.7033500000000001,
        "reward_min": -1.1801499999999994,
        "leartime_s": 0.03990237400284968,
        "sampletime": 0.7660024669894483,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 81400,
        "reward_mean": -0.2334499999999997,
        "reward_max": 1.1083,
        "reward_min": -1.3145999999999995,
        "leartime_s": 0.038208572019357234,
        "sampletime": 0.9575404049828649,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 81600,
        "reward_mean": -0.30804999999999993,
        "reward_max": 0.7606375000000001,
        "reward_min": -1.6144250000000004,
        "leartime_s": 0.09353533101966605,
        "sampletime": 1.1685862820013426,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 81800,
        "reward_mean": 0.09502499999999989,
        "reward_max": 1.006275,
        "reward_min": -1.1238250000000005,
        "leartime_s": 0.07644813798833638,
        "sampletime": 0.7869633880036417,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 82000,
        "reward_mean": -0.2849749999999999,
        "reward_max": 0.9220750000000002,
        "reward_min": -1.9744437499999998,
        "leartime_s": 0.06820191998849623,
        "sampletime": 0.8344211440125946,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 82200,
        "reward_mean": -0.2652499999999998,
        "reward_max": 0.8360000000000001,
        "reward_min": -1.5789437499999999,
        "leartime_s": 0.04504014700069092,
        "sampletime": 0.7913076579861809,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 82400,
        "reward_mean": -0.4863249999999999,
        "reward_max": 0.46707500000000013,
        "reward_min": -1.8923437500000002,
        "leartime_s": 0.04986410099081695,
        "sampletime": 0.7774026950064581,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 82600,
        "reward_mean": -0.2621999999999998,
        "reward_max": 0.8175875000000002,
        "reward_min": -2.1209249999999997,
        "leartime_s": 0.05883396900026128,
        "sampletime": 0.7700308579951525,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 82800,
        "reward_mean": -0.5103249999999999,
        "reward_max": 0.6391937500000002,
        "reward_min": -1.8656749999999995,
        "leartime_s": 0.08211586598190479,
        "sampletime": 1.0462262490182184,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 83000,
        "reward_mean": -0.26485,
        "reward_max": 0.6799187500000003,
        "reward_min": -1.7503749999999998,
        "leartime_s": 0.08791845000814646,
        "sampletime": 0.8025930080038961,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 83200,
        "reward_mean": -0.14449999999999968,
        "reward_max": 0.7700375000000002,
        "reward_min": -1.3710812499999996,
        "leartime_s": 0.04030867898836732,
        "sampletime": 0.803986888990039,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 83400,
        "reward_mean": -0.4124249999999998,
        "reward_max": 0.5810312500000001,
        "reward_min": -1.423674999999999,
        "leartime_s": 0.0653733600047417,
        "sampletime": 0.892186414974276,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 83600,
        "reward_mean": -0.20789999999999975,
        "reward_max": 0.7239375000000001,
        "reward_min": -1.5848250000000004,
        "leartime_s": 0.03320535700186156,
        "sampletime": 1.0028905340004712,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 83800,
        "reward_mean": -0.5027999999999998,
        "reward_max": 0.34938125000000025,
        "reward_min": -1.7671124999999996,
        "leartime_s": 0.05773631201009266,
        "sampletime": 0.830695566983195,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 84000,
        "reward_mean": -0.4016749999999999,
        "reward_max": 0.7432187500000006,
        "reward_min": -2.07805625,
        "leartime_s": 0.03369370600557886,
        "sampletime": 0.8825659739959519,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 84200,
        "reward_mean": -0.18512499999999982,
        "reward_max": 0.7873062500000001,
        "reward_min": -1.3372249999999992,
        "leartime_s": 0.03145205500186421,
        "sampletime": 0.8799170480051544,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 84400,
        "reward_mean": -0.4895499999999999,
        "reward_max": 0.6861499999999999,
        "reward_min": -1.6970250000000004,
        "leartime_s": 0.03676687501138076,
        "sampletime": 0.7538171919877641,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 84600,
        "reward_mean": -0.39944999999999997,
        "reward_max": 0.6349374999999999,
        "reward_min": -1.379625,
        "leartime_s": 0.020896595990052447,
        "sampletime": 0.8557387399778236,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 84800,
        "reward_mean": -0.35519999999999985,
        "reward_max": 0.7896625000000002,
        "reward_min": -1.5979437499999996,
        "leartime_s": 0.06467005499871448,
        "sampletime": 0.9298552580003161,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 85000,
        "reward_mean": -0.22754999999999984,
        "reward_max": 0.8115250000000002,
        "reward_min": -1.210774999999999,
        "leartime_s": 0.10549060799530707,
        "sampletime": 0.9319278720067814,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 85200,
        "reward_mean": -0.33697500000000014,
        "reward_max": 0.5292624999999997,
        "reward_min": -1.8425375,
        "leartime_s": 0.06689336101408117,
        "sampletime": 0.8144324210006744,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 85400,
        "reward_mean": -0.6269749999999998,
        "reward_max": 0.3452875000000001,
        "reward_min": -1.8005875,
        "leartime_s": 0.04616235301364213,
        "sampletime": 0.889470572990831,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 85600,
        "reward_mean": -0.3610499999999998,
        "reward_max": 0.6643125000000002,
        "reward_min": -1.7888875000000004,
        "leartime_s": 0.052807034022407606,
        "sampletime": 1.0033483580045868,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 85800,
        "reward_mean": -0.21639999999999976,
        "reward_max": 0.7448562500000004,
        "reward_min": -1.2630562499999998,
        "leartime_s": 0.04314938798779622,
        "sampletime": 0.7634476090024691,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 86000,
        "reward_mean": -0.29732499999999984,
        "reward_max": 0.5743687500000002,
        "reward_min": -2.05914375,
        "leartime_s": 0.07970451601431705,
        "sampletime": 0.8145606299804058,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 86200,
        "reward_mean": -0.4691750000000001,
        "reward_max": 0.70209375,
        "reward_min": -1.68040625,
        "leartime_s": 0.03771251899888739,
        "sampletime": 1.0050499869976193,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 86400,
        "reward_mean": -0.3631249999999998,
        "reward_max": 0.5114562500000003,
        "reward_min": -1.5443749999999998,
        "leartime_s": 0.09286277199862525,
        "sampletime": 0.8304269550135359,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 86600,
        "reward_mean": -0.16624999999999995,
        "reward_max": 0.7604187499999999,
        "reward_min": -1.3169187499999995,
        "leartime_s": 0.04746298599638976,
        "sampletime": 0.7273135900031775,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 86800,
        "reward_mean": -0.2617249999999999,
        "reward_max": 0.4964437500000002,
        "reward_min": -1.4450937499999996,
        "leartime_s": 0.039552483009174466,
        "sampletime": 0.8858087320113555,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 87000,
        "reward_mean": -0.4563499999999998,
        "reward_max": 0.32717500000000016,
        "reward_min": -1.6416937499999995,
        "leartime_s": 0.05962394198286347,
        "sampletime": 0.9915591779863462,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 87200,
        "reward_mean": -0.26465,
        "reward_max": 0.6236625,
        "reward_min": -1.9104812500000001,
        "leartime_s": 0.029218056006357074,
        "sampletime": 0.7912866569822654,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 87400,
        "reward_mean": -0.3981249999999998,
        "reward_max": 0.6683625000000002,
        "reward_min": -1.5928125,
        "leartime_s": 0.06916722102323547,
        "sampletime": 0.8411025000095833,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 87600,
        "reward_mean": -0.3696999999999998,
        "reward_max": 0.6954187500000003,
        "reward_min": -1.9123249999999998,
        "leartime_s": 0.09119246300542727,
        "sampletime": 0.9725555079930928,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 87800,
        "reward_mean": -0.3367749999999998,
        "reward_max": 0.5507937500000002,
        "reward_min": -1.870381249999999,
        "leartime_s": 0.0707093259843532,
        "sampletime": 0.8079192920122296,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 88000,
        "reward_mean": -0.16034999999999985,
        "reward_max": 0.8778125000000003,
        "reward_min": -1.35095625,
        "leartime_s": 0.04066205900744535,
        "sampletime": 0.8227080799988471,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 88200,
        "reward_mean": -0.04129999999999996,
        "reward_max": 0.78095,
        "reward_min": -1.0298749999999997,
        "leartime_s": 0.06429584400029853,
        "sampletime": 1.0544300290057436,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 88400,
        "reward_mean": -0.3137249999999997,
        "reward_max": 0.6194375000000003,
        "reward_min": -1.5170312499999996,
        "leartime_s": 0.05284919400583021,
        "sampletime": 0.7969748259929474,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 88600,
        "reward_mean": -0.31294999999999995,
        "reward_max": 0.46105,
        "reward_min": -1.9136250000000001,
        "leartime_s": 0.046466338011668995,
        "sampletime": 0.8001732770062517,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 88800,
        "reward_mean": -0.4669749999999999,
        "reward_max": 0.5825125,
        "reward_min": -1.9507937499999994,
        "leartime_s": 0.05759141201269813,
        "sampletime": 0.8428129990061279,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 89000,
        "reward_mean": -0.27414999999999984,
        "reward_max": 0.6967625000000003,
        "reward_min": -1.6713437499999995,
        "leartime_s": 0.05000344500876963,
        "sampletime": 0.8932367649977095,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 89200,
        "reward_mean": -0.21899999999999983,
        "reward_max": 0.6585875,
        "reward_min": -1.2691124999999999,
        "leartime_s": 0.05795069399755448,
        "sampletime": 0.7662502699822653,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 89400,
        "reward_mean": 0.03095000000000037,
        "reward_max": 1.0263000000000004,
        "reward_min": -1.2998874999999996,
        "leartime_s": 0.06920725500094704,
        "sampletime": 0.7950009909982327,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 89600,
        "reward_mean": -0.1251499999999999,
        "reward_max": 1.0058625,
        "reward_min": -1.4965937500000004,
        "leartime_s": 0.05402660998515785,
        "sampletime": 0.5944832499953918,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 89800,
        "reward_mean": 0.0164750000000001,
        "reward_max": 1.2719625,
        "reward_min": -1.150525,
        "leartime_s": 0.02873590899980627,
        "sampletime": 0.7149135809740983,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 90000,
        "reward_mean": -0.3698749999999997,
        "reward_max": 0.5957875000000002,
        "reward_min": -1.6668374999999995,
        "leartime_s": 0.06056950401398353,
        "sampletime": 0.8031191029876936,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 90200,
        "reward_mean": -0.3079499999999997,
        "reward_max": 0.5292375000000002,
        "reward_min": -1.34425,
        "leartime_s": 0.07231246802257374,
        "sampletime": 0.7336934089835268,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 90400,
        "reward_mean": -0.29027499999999984,
        "reward_max": 0.7189875000000003,
        "reward_min": -1.5173624999999993,
        "leartime_s": 0.05213395701139234,
        "sampletime": 0.622944145987276,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 90600,
        "reward_mean": -0.2620249999999999,
        "reward_max": 0.7351499999999999,
        "reward_min": -1.6654062499999998,
        "leartime_s": 0.0490123979980126,
        "sampletime": 0.7786855570157059,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 90800,
        "reward_mean": -0.16517499999999996,
        "reward_max": 0.596875,
        "reward_min": -1.6340687499999995,
        "leartime_s": 0.028886234009405598,
        "sampletime": 0.720649275026517,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 91000,
        "reward_mean": -0.0459249999999998,
        "reward_max": 1.1583250000000005,
        "reward_min": -1.2957625,
        "leartime_s": 0.0747841129777953,
        "sampletime": 0.7007230939925648,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 91200,
        "reward_mean": -0.3577499999999998,
        "reward_max": 0.7179187500000003,
        "reward_min": -1.7962624999999997,
        "leartime_s": 0.043836709985043854,
        "sampletime": 0.7344346910249442,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 91400,
        "reward_mean": -0.0114499999999998,
        "reward_max": 0.9895437500000004,
        "reward_min": -1.4597375000000004,
        "leartime_s": 0.089091986999847,
        "sampletime": 0.8377248180040624,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 91600,
        "reward_mean": -0.20399999999999976,
        "reward_max": 0.7423750000000002,
        "reward_min": -1.5737999999999999,
        "leartime_s": 0.04722183701233007,
        "sampletime": 0.6153851200069766,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 91800,
        "reward_mean": -0.16422499999999973,
        "reward_max": 0.7553312500000002,
        "reward_min": -1.426375,
        "leartime_s": 0.029518191004171968,
        "sampletime": 0.8978694440156687,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 92000,
        "reward_mean": -0.15362499999999976,
        "reward_max": 0.7536937500000002,
        "reward_min": -1.5465062499999997,
        "leartime_s": 0.04467274199123494,
        "sampletime": 0.6403709860169329,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 92200,
        "reward_mean": -0.19769999999999988,
        "reward_max": 0.6819875000000001,
        "reward_min": -1.12295625,
        "leartime_s": 0.06367226500879042,
        "sampletime": 0.6115834010124672,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 92400,
        "reward_mean": -0.14427499999999993,
        "reward_max": 0.80458125,
        "reward_min": -1.322025,
        "leartime_s": 0.041079114977037534,
        "sampletime": 0.7477326990047004,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 92600,
        "reward_mean": 0.015500000000000175,
        "reward_max": 0.9446374999999999,
        "reward_min": -1.1487249999999998,
        "leartime_s": 0.05690972099546343,
        "sampletime": 0.9731777099950705,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 92800,
        "reward_mean": -0.11899999999999986,
        "reward_max": 0.8197375000000001,
        "reward_min": -1.6210124999999997,
        "leartime_s": 0.03511372199864127,
        "sampletime": 0.7216443289944436,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 93000,
        "reward_mean": -0.4011749999999999,
        "reward_max": 0.8793500000000002,
        "reward_min": -1.74524375,
        "leartime_s": 0.04353537000133656,
        "sampletime": 0.7259226719907019,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 93200,
        "reward_mean": -0.4610499999999999,
        "reward_max": 0.48463749999999994,
        "reward_min": -1.5600499999999997,
        "leartime_s": 0.03503780599567108,
        "sampletime": 0.7782373360241763,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 93400,
        "reward_mean": -0.12657499999999977,
        "reward_max": 0.878525,
        "reward_min": -1.2408374999999998,
        "leartime_s": 0.03457444399828091,
        "sampletime": 0.6982469040085562,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 93600,
        "reward_mean": -0.17414999999999992,
        "reward_max": 0.7738750000000002,
        "reward_min": -1.47213125,
        "leartime_s": 0.045687809004448354,
        "sampletime": 0.6131413349939976,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 93800,
        "reward_mean": -0.3625749999999997,
        "reward_max": 0.6600625000000003,
        "reward_min": -1.67169375,
        "leartime_s": 0.041858840006170794,
        "sampletime": 0.9543464810121804,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 94000,
        "reward_mean": -0.09362499999999986,
        "reward_max": 0.9344187500000003,
        "reward_min": -1.4776625,
        "leartime_s": 0.046239199000410736,
        "sampletime": 0.722229710983811,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 94200,
        "reward_mean": -0.23302499999999987,
        "reward_max": 0.6821124999999999,
        "reward_min": -1.5388187500000001,
        "leartime_s": 0.029066839982988313,
        "sampletime": 0.6357577699818648,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 94400,
        "reward_mean": -0.21647499999999978,
        "reward_max": 0.85085,
        "reward_min": -1.399331249999999,
        "leartime_s": 0.0635292179940734,
        "sampletime": 0.7722014579921961,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 94600,
        "reward_mean": -0.21787499999999976,
        "reward_max": 0.7736375000000002,
        "reward_min": -1.7261874999999998,
        "leartime_s": 0.10033253498841077,
        "sampletime": 0.7247887639969122,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 94800,
        "reward_mean": -0.1289499999999997,
        "reward_max": 0.9118500000000004,
        "reward_min": -1.4438499999999994,
        "leartime_s": 0.030895795993274078,
        "sampletime": 0.6921197450137697,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 95000,
        "reward_mean": -0.17039999999999975,
        "reward_max": 0.8780625000000004,
        "reward_min": -1.5637124999999998,
        "leartime_s": 0.06592214401462115,
        "sampletime": 0.7628348139987793,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 95200,
        "reward_mean": -0.13562499999999977,
        "reward_max": 0.8458625000000003,
        "reward_min": -1.4930562499999998,
        "leartime_s": 0.04378538599121384,
        "sampletime": 0.890286527981516,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 95400,
        "reward_mean": -0.05064999999999971,
        "reward_max": 0.8477062500000003,
        "reward_min": -1.4570187500000005,
        "leartime_s": 0.04865539900492877,
        "sampletime": 0.727534117992036,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 95600,
        "reward_mean": 0.03995000000000017,
        "reward_max": 1.0165874999999998,
        "reward_min": -1.6100625,
        "leartime_s": 0.03654554899549112,
        "sampletime": 0.6798650499840733,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 95800,
        "reward_mean": 0.0070500000000002,
        "reward_max": 1.0138937500000005,
        "reward_min": -0.9134624999999996,
        "leartime_s": 0.03953405699576251,
        "sampletime": 0.8328903930087108,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 96000,
        "reward_mean": -0.41555,
        "reward_max": 0.6699249999999999,
        "reward_min": -1.7123375,
        "leartime_s": 0.048916226980509236,
        "sampletime": 0.6590751009935047,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 96200,
        "reward_mean": -0.05722499999999983,
        "reward_max": 0.8596687500000001,
        "reward_min": -1.5369687499999993,
        "leartime_s": 0.04390635699382983,
        "sampletime": 0.7292614630132448,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 96400,
        "reward_mean": -0.20804999999999968,
        "reward_max": 0.6764312500000004,
        "reward_min": -1.5737999999999996,
        "leartime_s": 0.04519421199802309,
        "sampletime": 0.7145615359768271,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 96600,
        "reward_mean": -0.31424999999999964,
        "reward_max": 0.7802375000000003,
        "reward_min": -1.4697374999999993,
        "leartime_s": 0.054754422017140314,
        "sampletime": 0.6505739639978856,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 96800,
        "reward_mean": 0.031425000000000106,
        "reward_max": 1.1359562500000002,
        "reward_min": -0.9530999999999998,
        "leartime_s": 0.05874340300215408,
        "sampletime": 0.9088148099835962,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 97000,
        "reward_mean": -0.3288749999999998,
        "reward_max": 0.7513437500000002,
        "reward_min": -1.4492749999999999,
        "leartime_s": 0.058746062975842506,
        "sampletime": 0.6628966519783717,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 97200,
        "reward_mean": -0.07749999999999982,
        "reward_max": 0.7366625,
        "reward_min": -1.4804312499999996,
        "leartime_s": 0.06825063700671308,
        "sampletime": 0.721342500008177,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 97400,
        "reward_mean": -0.10627499999999984,
        "reward_max": 0.8061624999999999,
        "reward_min": -1.49293125,
        "leartime_s": 0.04508062099921517,
        "sampletime": 0.8821512119902764,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 97600,
        "reward_mean": -0.2577249999999998,
        "reward_max": 0.7003375000000002,
        "reward_min": -1.4756124999999998,
        "leartime_s": 0.028597664000699297,
        "sampletime": 0.8087620410078671,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 97800,
        "reward_mean": -0.19259999999999963,
        "reward_max": 0.7819375000000005,
        "reward_min": -1.4081999999999997,
        "leartime_s": 0.035483180021401495,
        "sampletime": 0.6371294150012545,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 98000,
        "reward_mean": 0.07492500000000019,
        "reward_max": 0.9201312500000001,
        "reward_min": -1.1311874999999998,
        "leartime_s": 0.03098978300113231,
        "sampletime": 0.7013721019902732,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 98200,
        "reward_mean": -0.028499999999999522,
        "reward_max": 0.9934500000000004,
        "reward_min": -1.3857249999999997,
        "leartime_s": 0.06137419899459928,
        "sampletime": 1.0067079039872624,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 98400,
        "reward_mean": -0.1502249999999997,
        "reward_max": 0.7387250000000005,
        "reward_min": -1.8418562499999993,
        "leartime_s": 0.042123866005567834,
        "sampletime": 0.7187320890079718,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 98600,
        "reward_mean": -0.010124999999999764,
        "reward_max": 0.7857500000000001,
        "reward_min": -1.0888375,
        "leartime_s": 0.030258120998041704,
        "sampletime": 0.8501056130044162,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 98800,
        "reward_mean": -0.10517499999999975,
        "reward_max": 0.9950062500000005,
        "reward_min": -1.49635,
        "leartime_s": 0.06910937000066042,
        "sampletime": 0.7905840830062516,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 99000,
        "reward_mean": -0.39289999999999975,
        "reward_max": 0.41442500000000027,
        "reward_min": -1.8448125,
        "leartime_s": 0.039190172974485904,
        "sampletime": 0.6892186420154758,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 99200,
        "reward_mean": -0.10762499999999987,
        "reward_max": 0.8999000000000003,
        "reward_min": -1.40020625,
        "leartime_s": 0.048816713999258354,
        "sampletime": 0.6714405859820545,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 99400,
        "reward_mean": -0.26512500000000006,
        "reward_max": 0.8017875000000001,
        "reward_min": -2.03266875,
        "leartime_s": 0.03362278899294324,
        "sampletime": 0.947226824995596,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 99600,
        "reward_mean": -0.40719999999999973,
        "reward_max": 0.5325625000000004,
        "reward_min": -1.4751374999999995,
        "leartime_s": 0.08023918099934235,
        "sampletime": 0.6899293279857375,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 99800,
        "reward_mean": -0.21419999999999964,
        "reward_max": 0.6461437500000003,
        "reward_min": -1.4511499999999995,
        "leartime_s": 0.05458841100335121,
        "sampletime": 0.7270981399924494,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 100000,
        "reward_mean": -0.3497999999999998,
        "reward_max": 0.6699687500000001,
        "reward_min": -1.6420625,
        "leartime_s": 0.05247532497742213,
        "sampletime": 0.8196537960029673,
        "best_mean": 0.13197500000000015,
        "best_max": 1.0361625,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 2133132,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]