[
    {
        "generation": 1,
        "timesteps": 200,
        "reward_mean": -39.10865000000001,
        "reward_max": -3.4611874999999994,
        "reward_min": -80.95306875000001,
        "leartime_s": 0.04994254600023851,
        "sampletime": 0.6653815990139265,
        "best_mean": -39.10865000000001,
        "best_max": -3.4611874999999994,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 2,
        "timesteps": 400,
        "reward_mean": -35.57759999999999,
        "reward_max": -2.2939,
        "reward_min": -209.31207500000002,
        "leartime_s": 0.020086349017219618,
        "sampletime": 0.766374418977648,
        "best_mean": -35.57759999999999,
        "best_max": -2.2939,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 3,
        "timesteps": 600,
        "reward_mean": -19.28135,
        "reward_max": 0.1955125000000002,
        "reward_min": -89.86763749999999,
        "leartime_s": 0.011285468004643917,
        "sampletime": 0.8297995360044297,
        "best_mean": -19.28135,
        "best_max": 0.1955125000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 4,
        "timesteps": 800,
        "reward_mean": -18.239375,
        "reward_max": 2.0145750000000002,
        "reward_min": -41.456025,
        "leartime_s": 0.048109358991496265,
        "sampletime": 0.788519775000168,
        "best_mean": -18.239375,
        "best_max": 2.0145750000000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 5,
        "timesteps": 1000,
        "reward_mean": -17.9975,
        "reward_max": 1.2893374999999998,
        "reward_min": -55.06396875,
        "leartime_s": 0.01061415602453053,
        "sampletime": 0.7101997410063632,
        "best_mean": -17.9975,
        "best_max": 1.2893374999999998,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 6,
        "timesteps": 1200,
        "reward_mean": -7.77055,
        "reward_max": 1.4428750000000004,
        "reward_min": -78.25667499999999,
        "leartime_s": 0.012983316002646461,
        "sampletime": 0.8669844200194348,
        "best_mean": -7.77055,
        "best_max": 1.4428750000000004,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 7,
        "timesteps": 1400,
        "reward_mean": -3.0683249999999997,
        "reward_max": 2.8394875,
        "reward_min": -38.16516875000001,
        "leartime_s": 0.03538796698558144,
        "sampletime": 0.7763780509994831,
        "best_mean": -3.0683249999999997,
        "best_max": 2.8394875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 8,
        "timesteps": 1600,
        "reward_mean": -1.310425,
        "reward_max": 2.86001875,
        "reward_min": -26.723924999999994,
        "leartime_s": 0.018360777001362294,
        "sampletime": 0.7195317900041118,
        "best_mean": -1.310425,
        "best_max": 2.86001875,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 9,
        "timesteps": 1800,
        "reward_mean": -0.5009999999999999,
        "reward_max": 1.6336562499999996,
        "reward_min": -7.414187500000001,
        "leartime_s": 0.034465913980966434,
        "sampletime": 0.6728257929789834,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 10,
        "timesteps": 2000,
        "reward_mean": -0.9532999999999998,
        "reward_max": 0.9719000000000001,
        "reward_min": -5.4129999999999985,
        "leartime_s": 0.05415362099302001,
        "sampletime": 0.9246588950045407,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 11,
        "timesteps": 2200,
        "reward_mean": -1.3762249999999998,
        "reward_max": -0.26138750000000016,
        "reward_min": -3.5911874999999998,
        "leartime_s": 0.022476329992059618,
        "sampletime": 0.6954012470087036,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 12,
        "timesteps": 2400,
        "reward_mean": -1.3578000000000001,
        "reward_max": -0.4218875000000001,
        "reward_min": -3.0888312500000006,
        "leartime_s": 0.008709172019734979,
        "sampletime": 0.721839606994763,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 13,
        "timesteps": 2600,
        "reward_mean": -1.2885000000000002,
        "reward_max": -0.14738749999999998,
        "reward_min": -3.245662499999999,
        "leartime_s": 0.012313506013015285,
        "sampletime": 0.735168525017798,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 14,
        "timesteps": 2800,
        "reward_mean": -0.6015750000000001,
        "reward_max": 0.4422125,
        "reward_min": -3.443600000000001,
        "leartime_s": 0.006627792987274006,
        "sampletime": 0.8464863630069885,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 15,
        "timesteps": 3000,
        "reward_mean": -1.1865749999999997,
        "reward_max": 0.048881249999999966,
        "reward_min": -2.9328624999999984,
        "leartime_s": 0.0425281040079426,
        "sampletime": 0.754006290982943,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 16,
        "timesteps": 3200,
        "reward_mean": -1.1539999999999997,
        "reward_max": -0.13844374999999995,
        "reward_min": -2.8572749999999996,
        "leartime_s": 0.016858560993568972,
        "sampletime": 0.9561615650018211,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 17,
        "timesteps": 3400,
        "reward_mean": -1.06075,
        "reward_max": -0.02733125,
        "reward_min": -2.8346500000000012,
        "leartime_s": 0.027781379991210997,
        "sampletime": 1.0966171589971054,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 18,
        "timesteps": 3600,
        "reward_mean": -1.2898000000000003,
        "reward_max": -0.4359687500000001,
        "reward_min": -2.2942562499999997,
        "leartime_s": 0.009771103999810293,
        "sampletime": 0.8127176300040446,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 19,
        "timesteps": 3800,
        "reward_mean": -1.5666750000000005,
        "reward_max": -0.5551562500000002,
        "reward_min": -3.279381250000001,
        "leartime_s": 0.03213267697719857,
        "sampletime": 0.8307482689851895,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 20,
        "timesteps": 4000,
        "reward_mean": -1.3292000000000004,
        "reward_max": -0.4405000000000001,
        "reward_min": -2.2566062500000004,
        "leartime_s": 0.007534195989137515,
        "sampletime": 1.0345772510045208,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 21,
        "timesteps": 4200,
        "reward_mean": -1.43565,
        "reward_max": -0.4890125000000003,
        "reward_min": -3.0546624999999996,
        "leartime_s": 0.023312106990488246,
        "sampletime": 0.8507041310076602,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 22,
        "timesteps": 4400,
        "reward_mean": -1.4136999999999997,
        "reward_max": -0.5814437500000001,
        "reward_min": -2.5784687499999994,
        "leartime_s": 0.025599830987630412,
        "sampletime": 0.8334151830058545,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 23,
        "timesteps": 4600,
        "reward_mean": -1.3872250000000002,
        "reward_max": -0.30969375000000005,
        "reward_min": -2.8100875000000003,
        "leartime_s": 0.030976823007222265,
        "sampletime": 0.9354168300051242,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 24,
        "timesteps": 4800,
        "reward_mean": -1.314025,
        "reward_max": -0.4351500000000002,
        "reward_min": -2.7381625,
        "leartime_s": 0.052003378979861736,
        "sampletime": 0.9356416249938775,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 25,
        "timesteps": 5000,
        "reward_mean": -1.0417250000000002,
        "reward_max": -0.1996374999999999,
        "reward_min": -2.369475,
        "leartime_s": 0.017034951015375555,
        "sampletime": 0.8111777059966698,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 26,
        "timesteps": 5200,
        "reward_mean": -1.0597750000000001,
        "reward_max": -0.1884999999999999,
        "reward_min": -2.1523125,
        "leartime_s": 0.012814925983548164,
        "sampletime": 0.7424229210009798,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 27,
        "timesteps": 5400,
        "reward_mean": -1.1535499999999999,
        "reward_max": -0.23370624999999984,
        "reward_min": -2.4387312500000005,
        "leartime_s": 0.015470713988179341,
        "sampletime": 0.9552783530089073,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 28,
        "timesteps": 5600,
        "reward_mean": -1.020125,
        "reward_max": -0.08931874999999993,
        "reward_min": -1.96383125,
        "leartime_s": 0.009221935004461557,
        "sampletime": 0.8104018330050167,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 29,
        "timesteps": 5800,
        "reward_mean": -1.1784499999999998,
        "reward_max": -0.22910625,
        "reward_min": -2.1283625,
        "leartime_s": 0.015027117013232782,
        "sampletime": 0.7701350520073902,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 30,
        "timesteps": 6000,
        "reward_mean": -0.8645250000000001,
        "reward_max": 0.14333124999999988,
        "reward_min": -2.2671749999999995,
        "leartime_s": 0.027203888981603086,
        "sampletime": 1.086359699984314,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 31,
        "timesteps": 6200,
        "reward_mean": -1.00335,
        "reward_max": -0.050375000000000225,
        "reward_min": -2.3245125000000004,
        "leartime_s": 0.030686166021041572,
        "sampletime": 0.8376418460102286,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 32,
        "timesteps": 6400,
        "reward_mean": -0.9594250000000002,
        "reward_max": 0.06586249999999985,
        "reward_min": -2.0516937500000005,
        "leartime_s": 0.008597531996201724,
        "sampletime": 0.9548571880150121,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 33,
        "timesteps": 6600,
        "reward_mean": -0.974625,
        "reward_max": 0.014237499999999959,
        "reward_min": -2.1202875000000008,
        "leartime_s": 0.05240315498667769,
        "sampletime": 0.8832381780084688,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 34,
        "timesteps": 6800,
        "reward_mean": -0.806725,
        "reward_max": 0.07508749999999997,
        "reward_min": -2.51585625,
        "leartime_s": 0.0322448090009857,
        "sampletime": 0.7432000909757335,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 35,
        "timesteps": 7000,
        "reward_mean": -0.5842,
        "reward_max": 0.32353750000000003,
        "reward_min": -1.7456,
        "leartime_s": 0.026373900996986777,
        "sampletime": 0.8200536599906627,
        "best_mean": -0.5009999999999999,
        "best_max": 1.6336562499999996,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 36,
        "timesteps": 7200,
        "reward_mean": -0.4610999999999998,
        "reward_max": 0.7318437500000003,
        "reward_min": -1.4599499999999994,
        "leartime_s": 0.02354812901467085,
        "sampletime": 0.837264140980551,
        "best_mean": -0.4610999999999998,
        "best_max": 0.7318437500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 37,
        "timesteps": 7400,
        "reward_mean": -0.536775,
        "reward_max": 0.33938750000000006,
        "reward_min": -1.8042062500000005,
        "leartime_s": 0.07673982298001647,
        "sampletime": 0.938521331991069,
        "best_mean": -0.4610999999999998,
        "best_max": 0.7318437500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 38,
        "timesteps": 7600,
        "reward_mean": -0.687425,
        "reward_max": 0.07828750000000004,
        "reward_min": -1.5798249999999996,
        "leartime_s": 0.03191114900982939,
        "sampletime": 0.8339457389956806,
        "best_mean": -0.4610999999999998,
        "best_max": 0.7318437500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 39,
        "timesteps": 7800,
        "reward_mean": -0.5213249999999997,
        "reward_max": 0.4415937500000001,
        "reward_min": -1.8095062499999999,
        "leartime_s": 0.021092540002427995,
        "sampletime": 0.9093425299797673,
        "best_mean": -0.4610999999999998,
        "best_max": 0.7318437500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 40,
        "timesteps": 8000,
        "reward_mean": -0.18887499999999996,
        "reward_max": 0.5542937500000003,
        "reward_min": -1.3889375000000006,
        "leartime_s": 0.05814783798996359,
        "sampletime": 0.9187128439953085,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 41,
        "timesteps": 8200,
        "reward_mean": -0.4694249999999998,
        "reward_max": 0.47670000000000007,
        "reward_min": -1.3112499999999994,
        "leartime_s": 0.013111499982187524,
        "sampletime": 0.8345563039765693,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 42,
        "timesteps": 8400,
        "reward_mean": -0.4046250000000001,
        "reward_max": 0.45554999999999995,
        "reward_min": -1.6833875000000007,
        "leartime_s": 0.0454424709896557,
        "sampletime": 0.9447076020005625,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 43,
        "timesteps": 8600,
        "reward_mean": -0.3072999999999999,
        "reward_max": 0.7819000000000003,
        "reward_min": -1.55671875,
        "leartime_s": 0.06285655501415022,
        "sampletime": 0.8176878610101994,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 44,
        "timesteps": 8800,
        "reward_mean": -0.60605,
        "reward_max": 0.12435000000000011,
        "reward_min": -1.51035,
        "leartime_s": 0.050966919981874526,
        "sampletime": 0.7926838200073689,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 45,
        "timesteps": 9000,
        "reward_mean": -0.4351999999999998,
        "reward_max": 0.3106375000000002,
        "reward_min": -1.7580874999999994,
        "leartime_s": 0.01618162199156359,
        "sampletime": 0.9371896759839728,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 46,
        "timesteps": 9200,
        "reward_mean": -0.20714999999999978,
        "reward_max": 0.65934375,
        "reward_min": -1.3675562499999998,
        "leartime_s": 0.03493612300371751,
        "sampletime": 0.8714071649883408,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 47,
        "timesteps": 9400,
        "reward_mean": -0.5273749999999999,
        "reward_max": 0.3240812500000002,
        "reward_min": -1.6801249999999994,
        "leartime_s": 0.031549539999105036,
        "sampletime": 0.8459748519817367,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 48,
        "timesteps": 9600,
        "reward_mean": -0.3317749999999999,
        "reward_max": 0.6047250000000002,
        "reward_min": -1.9588375,
        "leartime_s": 0.02614860999165103,
        "sampletime": 0.792040204978548,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 49,
        "timesteps": 9800,
        "reward_mean": -0.24394999999999972,
        "reward_max": 0.8241687500000003,
        "reward_min": -1.234575,
        "leartime_s": 0.03164368000579998,
        "sampletime": 0.84429413502221,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 50,
        "timesteps": 10000,
        "reward_mean": -0.29632499999999984,
        "reward_max": 0.6321687500000003,
        "reward_min": -1.5747874999999998,
        "leartime_s": 0.014903806993970647,
        "sampletime": 0.7068694379995577,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 51,
        "timesteps": 10200,
        "reward_mean": -0.2823749999999999,
        "reward_max": 0.8510187500000002,
        "reward_min": -1.90101875,
        "leartime_s": 0.04637926700524986,
        "sampletime": 1.0052817259856965,
        "best_mean": -0.18887499999999996,
        "best_max": 0.5542937500000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 52,
        "timesteps": 10400,
        "reward_mean": -0.15754999999999977,
        "reward_max": 1.0326250000000003,
        "reward_min": -1.155299999999999,
        "leartime_s": 0.04215252798167057,
        "sampletime": 0.8203486099955626,
        "best_mean": -0.15754999999999977,
        "best_max": 1.0326250000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 53,
        "timesteps": 10600,
        "reward_mean": -0.13654999999999987,
        "reward_max": 0.9037937500000002,
        "reward_min": -0.9258500000000001,
        "leartime_s": 0.045839255006285384,
        "sampletime": 0.7652532809879631,
        "best_mean": -0.13654999999999987,
        "best_max": 0.9037937500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 54,
        "timesteps": 10800,
        "reward_mean": -0.026799999999999904,
        "reward_max": 0.9111375,
        "reward_min": -1.0640500000000002,
        "leartime_s": 0.017448535974835977,
        "sampletime": 1.0143945050076582,
        "best_mean": -0.026799999999999904,
        "best_max": 0.9111375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 55,
        "timesteps": 11000,
        "reward_mean": -0.08362499999999992,
        "reward_max": 0.786,
        "reward_min": -1.311075,
        "leartime_s": 0.030754792009247467,
        "sampletime": 0.9456242620071862,
        "best_mean": -0.026799999999999904,
        "best_max": 0.9111375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 56,
        "timesteps": 11200,
        "reward_mean": -0.07919999999999983,
        "reward_max": 0.7876812500000003,
        "reward_min": -1.7581125,
        "leartime_s": 0.01885999200749211,
        "sampletime": 0.8139889840094838,
        "best_mean": -0.026799999999999904,
        "best_max": 0.9111375,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 57,
        "timesteps": 11400,
        "reward_mean": 0.07600000000000011,
        "reward_max": 0.9493625000000003,
        "reward_min": -1.41971875,
        "leartime_s": 0.025686907989438623,
        "sampletime": 0.8423472020076588,
        "best_mean": 0.07600000000000011,
        "best_max": 0.9493625000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 58,
        "timesteps": 11600,
        "reward_mean": -0.04077499999999995,
        "reward_max": 0.8425874999999998,
        "reward_min": -1.14599375,
        "leartime_s": 0.061399094003718346,
        "sampletime": 1.156103802000871,
        "best_mean": 0.07600000000000011,
        "best_max": 0.9493625000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 59,
        "timesteps": 11800,
        "reward_mean": -0.11214999999999996,
        "reward_max": 1.0026499999999998,
        "reward_min": -1.5515687500000002,
        "leartime_s": 0.02569542801938951,
        "sampletime": 0.8593342200038023,
        "best_mean": 0.07600000000000011,
        "best_max": 0.9493625000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 60,
        "timesteps": 12000,
        "reward_mean": 0.031000000000000184,
        "reward_max": 1.1814875000000002,
        "reward_min": -1.07015,
        "leartime_s": 0.02236937000998296,
        "sampletime": 0.7333077200164553,
        "best_mean": 0.07600000000000011,
        "best_max": 0.9493625000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 61,
        "timesteps": 12200,
        "reward_mean": -0.1650499999999999,
        "reward_max": 0.6873312500000002,
        "reward_min": -1.2146624999999998,
        "leartime_s": 0.02219359399168752,
        "sampletime": 0.9635299069923349,
        "best_mean": 0.07600000000000011,
        "best_max": 0.9493625000000003,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 62,
        "timesteps": 12400,
        "reward_mean": 0.07764999999999991,
        "reward_max": 0.9319687499999997,
        "reward_min": -0.9377375,
        "leartime_s": 0.020959164015948772,
        "sampletime": 0.7314822870248463,
        "best_mean": 0.07764999999999991,
        "best_max": 0.9319687499999997,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 63,
        "timesteps": 12600,
        "reward_mean": 0.1439750000000001,
        "reward_max": 0.8350562499999999,
        "reward_min": -1.1162812500000001,
        "leartime_s": 0.020844729006057605,
        "sampletime": 0.7890141259995289,
        "best_mean": 0.1439750000000001,
        "best_max": 0.8350562499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 64,
        "timesteps": 12800,
        "reward_mean": -0.12907499999999988,
        "reward_max": 0.8176125000000002,
        "reward_min": -1.1321562499999998,
        "leartime_s": 0.06256830302299932,
        "sampletime": 0.9871389239851851,
        "best_mean": 0.1439750000000001,
        "best_max": 0.8350562499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 65,
        "timesteps": 13000,
        "reward_mean": 0.07387500000000012,
        "reward_max": 0.8830437500000002,
        "reward_min": -0.8701687499999998,
        "leartime_s": 0.028553559008287266,
        "sampletime": 0.9054607870057225,
        "best_mean": 0.1439750000000001,
        "best_max": 0.8350562499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 66,
        "timesteps": 13200,
        "reward_mean": -0.011424999999999963,
        "reward_max": 0.9403875000000002,
        "reward_min": -1.5444124999999995,
        "leartime_s": 0.029885404015658423,
        "sampletime": 0.826755486021284,
        "best_mean": 0.1439750000000001,
        "best_max": 0.8350562499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 67,
        "timesteps": 13400,
        "reward_mean": 0.050200000000000015,
        "reward_max": 0.8915875,
        "reward_min": -1.3892624999999998,
        "leartime_s": 0.028826769994338974,
        "sampletime": 0.8142915799980983,
        "best_mean": 0.1439750000000001,
        "best_max": 0.8350562499999999,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 68,
        "timesteps": 13600,
        "reward_mean": 0.1605250000000001,
        "reward_max": 1.0056312500000002,
        "reward_min": -0.8762875,
        "leartime_s": 0.05033933598315343,
        "sampletime": 0.8887657120067161,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 69,
        "timesteps": 13800,
        "reward_mean": 0.02142500000000012,
        "reward_max": 1.0588937500000002,
        "reward_min": -0.9921875000000003,
        "leartime_s": 0.030893571994965896,
        "sampletime": 0.7873078629781958,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 70,
        "timesteps": 14000,
        "reward_mean": -0.08304999999999997,
        "reward_max": 0.7253375000000002,
        "reward_min": -1.0877374999999998,
        "leartime_s": 0.030437418987276033,
        "sampletime": 0.8779016289918218,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 71,
        "timesteps": 14200,
        "reward_mean": 0.021025000000000113,
        "reward_max": 0.86848125,
        "reward_min": -1.1272312500000001,
        "leartime_s": 0.07185921902419068,
        "sampletime": 1.1101567020232324,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 72,
        "timesteps": 14400,
        "reward_mean": -0.00742499999999991,
        "reward_max": 0.9304187500000002,
        "reward_min": -1.0629062499999997,
        "leartime_s": 0.03605025101569481,
        "sampletime": 0.7612385450047441,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 73,
        "timesteps": 14600,
        "reward_mean": -0.0720749999999999,
        "reward_max": 0.9419625000000001,
        "reward_min": -0.9928999999999999,
        "leartime_s": 0.037212266004644334,
        "sampletime": 0.7656761939870194,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 74,
        "timesteps": 14800,
        "reward_mean": 0.07027500000000003,
        "reward_max": 0.9437500000000001,
        "reward_min": -1.02728125,
        "leartime_s": 0.02469105599448085,
        "sampletime": 0.9036779800080694,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 75,
        "timesteps": 15000,
        "reward_mean": 0.14557500000000015,
        "reward_max": 1.0978187500000003,
        "reward_min": -0.9399624999999996,
        "leartime_s": 0.08102944801794365,
        "sampletime": 1.0587341039790772,
        "best_mean": 0.1605250000000001,
        "best_max": 1.0056312500000002,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 76,
        "timesteps": 15200,
        "reward_mean": 0.40332500000000004,
        "reward_max": 1.319175,
        "reward_min": -0.868725,
        "leartime_s": 0.035002315999008715,
        "sampletime": 0.8109845530125313,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 77,
        "timesteps": 15400,
        "reward_mean": 0.10230000000000015,
        "reward_max": 0.9438125,
        "reward_min": -1.0030750000000002,
        "leartime_s": 0.00984579199575819,
        "sampletime": 0.8515694260131568,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 78,
        "timesteps": 15600,
        "reward_mean": 0.18522500000000006,
        "reward_max": 1.0936500000000002,
        "reward_min": -1.1921374999999999,
        "leartime_s": 0.037733377976110205,
        "sampletime": 1.0208831019990612,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 79,
        "timesteps": 15800,
        "reward_mean": 0.031125000000000107,
        "reward_max": 0.9010312500000004,
        "reward_min": -1.3298312499999996,
        "leartime_s": 0.019178616988938302,
        "sampletime": 1.1141870820138138,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 80,
        "timesteps": 16000,
        "reward_mean": 0.021675000000000146,
        "reward_max": 0.9297625000000002,
        "reward_min": -1.14489375,
        "leartime_s": 0.017745192017173395,
        "sampletime": 0.8712022690160666,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 81,
        "timesteps": 16200,
        "reward_mean": 0.16545000000000012,
        "reward_max": 1.3292562499999998,
        "reward_min": -1.1696187499999997,
        "leartime_s": 0.011399106995668262,
        "sampletime": 0.9911497699795291,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 82,
        "timesteps": 16400,
        "reward_mean": 0.2442000000000002,
        "reward_max": 1.1420124999999999,
        "reward_min": -0.9689999999999998,
        "leartime_s": 0.04727194699808024,
        "sampletime": 0.8892744010081515,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 83,
        "timesteps": 16600,
        "reward_mean": 0.05762500000000022,
        "reward_max": 0.8817500000000003,
        "reward_min": -1.10016875,
        "leartime_s": 0.022613609995460138,
        "sampletime": 0.8046405219938606,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 84,
        "timesteps": 16800,
        "reward_mean": 0.054450000000000116,
        "reward_max": 0.8326375,
        "reward_min": -1.0510062500000001,
        "leartime_s": 0.0387985740089789,
        "sampletime": 0.7842537249962334,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 85,
        "timesteps": 17000,
        "reward_mean": 0.19852500000000028,
        "reward_max": 1.0797250000000003,
        "reward_min": -0.7301749999999998,
        "leartime_s": 0.01725879599689506,
        "sampletime": 0.9048477169999387,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 86,
        "timesteps": 17200,
        "reward_mean": 0.07367500000000005,
        "reward_max": 0.9833062499999999,
        "reward_min": -1.0444999999999998,
        "leartime_s": 0.03184747800696641,
        "sampletime": 0.7531713579955976,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 87,
        "timesteps": 17400,
        "reward_mean": -0.1452249999999999,
        "reward_max": 0.9604124999999999,
        "reward_min": -1.3195375,
        "leartime_s": 0.021715414011850953,
        "sampletime": 0.7957571120059583,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 88,
        "timesteps": 17600,
        "reward_mean": 0.07172500000000002,
        "reward_max": 0.9111375000000003,
        "reward_min": -1.3443375,
        "leartime_s": 0.09496331997797824,
        "sampletime": 0.9092763270018622,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 89,
        "timesteps": 17800,
        "reward_mean": -0.12099999999999969,
        "reward_max": 0.7424875000000002,
        "reward_min": -1.3578312499999996,
        "leartime_s": 0.028953423985512927,
        "sampletime": 0.6960663399950135,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 90,
        "timesteps": 18000,
        "reward_mean": 0.12020000000000003,
        "reward_max": 1.0354187499999998,
        "reward_min": -0.9004000000000002,
        "leartime_s": 0.023579884000355378,
        "sampletime": 0.8730859300121665,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 91,
        "timesteps": 18200,
        "reward_mean": 0.017900000000000235,
        "reward_max": 1.028825,
        "reward_min": -1.0374499999999989,
        "leartime_s": 0.04050041298614815,
        "sampletime": 1.0293929710169323,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 92,
        "timesteps": 18400,
        "reward_mean": -0.20842499999999986,
        "reward_max": 0.7987687500000001,
        "reward_min": -1.5627312500000001,
        "leartime_s": 0.017522930982522666,
        "sampletime": 0.8523516190180089,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 93,
        "timesteps": 18600,
        "reward_mean": 0.024425000000000138,
        "reward_max": 1.13745625,
        "reward_min": -0.97975625,
        "leartime_s": 0.059199304989306256,
        "sampletime": 0.7305525219999254,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 94,
        "timesteps": 18800,
        "reward_mean": 0.021700000000000115,
        "reward_max": 0.94239375,
        "reward_min": -0.9743812499999998,
        "leartime_s": 0.021211715997196734,
        "sampletime": 1.0701174919959158,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 95,
        "timesteps": 19000,
        "reward_mean": -0.148,
        "reward_max": 0.7429437500000001,
        "reward_min": -1.2536500000000004,
        "leartime_s": 0.029625427996506914,
        "sampletime": 0.8113695569918491,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 96,
        "timesteps": 19200,
        "reward_mean": 0.2211000000000001,
        "reward_max": 1.0342,
        "reward_min": -0.6622187500000001,
        "leartime_s": 0.0460471140104346,
        "sampletime": 0.8223673139873426,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 97,
        "timesteps": 19400,
        "reward_mean": -0.18342499999999978,
        "reward_max": 0.6648312500000003,
        "reward_min": -1.42008125,
        "leartime_s": 0.016714926983695477,
        "sampletime": 1.0906040989793837,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 98,
        "timesteps": 19600,
        "reward_mean": -0.03809999999999995,
        "reward_max": 0.7862187500000003,
        "reward_min": -1.3475125000000001,
        "leartime_s": 0.06504670297726989,
        "sampletime": 0.9572646970045753,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 99,
        "timesteps": 19800,
        "reward_mean": -0.13492499999999985,
        "reward_max": 0.6732687500000003,
        "reward_min": -1.56520625,
        "leartime_s": 0.014455338998232037,
        "sampletime": 0.7612714690039866,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 100,
        "timesteps": 20000,
        "reward_mean": 0.08350000000000013,
        "reward_max": 1.0789500000000003,
        "reward_min": -0.9154749999999997,
        "leartime_s": 0.023740575998090208,
        "sampletime": 0.8174292079929728,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 101,
        "timesteps": 20200,
        "reward_mean": 0.14172500000000007,
        "reward_max": 0.9890625000000002,
        "reward_min": -1.1911874999999996,
        "leartime_s": 0.053707999002654105,
        "sampletime": 0.9906230960041285,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 102,
        "timesteps": 20400,
        "reward_mean": -0.38157499999999983,
        "reward_max": 0.5743687500000001,
        "reward_min": -1.4395875,
        "leartime_s": 0.04136290799942799,
        "sampletime": 0.8295241669984534,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 103,
        "timesteps": 20600,
        "reward_mean": -0.07722499999999986,
        "reward_max": 0.7352375,
        "reward_min": -1.2092062499999998,
        "leartime_s": 0.010599372995784506,
        "sampletime": 0.8803611260082107,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 104,
        "timesteps": 20800,
        "reward_mean": 0.24950000000000025,
        "reward_max": 1.0200000000000002,
        "reward_min": -1.1084687499999997,
        "leartime_s": 0.034363901999313384,
        "sampletime": 1.0128200809995178,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 105,
        "timesteps": 21000,
        "reward_mean": 0.1466750000000002,
        "reward_max": 1.1117375000000003,
        "reward_min": -0.8745187499999999,
        "leartime_s": 0.03182858999934979,
        "sampletime": 0.8982365700067021,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 106,
        "timesteps": 21200,
        "reward_mean": 0.26310000000000017,
        "reward_max": 1.1103937500000003,
        "reward_min": -0.7818187499999998,
        "leartime_s": 0.02424331899965182,
        "sampletime": 0.7803826619929168,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 107,
        "timesteps": 21400,
        "reward_mean": 0.01244999999999994,
        "reward_max": 1.2679937499999998,
        "reward_min": -1.1742374999999998,
        "leartime_s": 0.021248839009786025,
        "sampletime": 0.8288042930071242,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 108,
        "timesteps": 21600,
        "reward_mean": 0.09897500000000028,
        "reward_max": 1.1034875000000006,
        "reward_min": -0.8223999999999998,
        "leartime_s": 0.020068850979441777,
        "sampletime": 1.0666295510018244,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 109,
        "timesteps": 21800,
        "reward_mean": -0.18805,
        "reward_max": 0.7222312499999999,
        "reward_min": -1.1376625000000002,
        "leartime_s": 0.021801181021146476,
        "sampletime": 0.8954445070121437,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 110,
        "timesteps": 22000,
        "reward_mean": 0.01932500000000014,
        "reward_max": 0.8219125,
        "reward_min": -1.38139375,
        "leartime_s": 0.018842746008886024,
        "sampletime": 0.8239684170112014,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 111,
        "timesteps": 22200,
        "reward_mean": -0.002774999999999947,
        "reward_max": 1.10375,
        "reward_min": -1.8807125,
        "leartime_s": 0.04254220399889164,
        "sampletime": 0.9722372220130637,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 112,
        "timesteps": 22400,
        "reward_mean": -0.09604999999999982,
        "reward_max": 0.8789187500000001,
        "reward_min": -1.3119750000000001,
        "leartime_s": 0.043627687002299353,
        "sampletime": 0.7521587510127574,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 113,
        "timesteps": 22600,
        "reward_mean": 0.13765000000000022,
        "reward_max": 0.9510500000000004,
        "reward_min": -0.7979687499999999,
        "leartime_s": 0.03672729100799188,
        "sampletime": 0.7958336229785345,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 114,
        "timesteps": 22800,
        "reward_mean": -0.12349999999999986,
        "reward_max": 0.9138125,
        "reward_min": -1.2680624999999996,
        "leartime_s": 0.060969910002313554,
        "sampletime": 0.9621355129929725,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 115,
        "timesteps": 23000,
        "reward_mean": 0.11822500000000016,
        "reward_max": 1.13243125,
        "reward_min": -1.36946875,
        "leartime_s": 0.02106797500164248,
        "sampletime": 1.1116924450034276,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 116,
        "timesteps": 23200,
        "reward_mean": 0.08912500000000005,
        "reward_max": 0.9321625000000001,
        "reward_min": -1.3158687500000004,
        "leartime_s": 0.032127822982147336,
        "sampletime": 0.7551691970147658,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 117,
        "timesteps": 23400,
        "reward_mean": -0.17769999999999983,
        "reward_max": 0.6806187499999999,
        "reward_min": -1.2243124999999997,
        "leartime_s": 0.047537617007037625,
        "sampletime": 0.7179847380029969,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 118,
        "timesteps": 23600,
        "reward_mean": 0.08825000000000018,
        "reward_max": 0.910825,
        "reward_min": -1.2824687499999998,
        "leartime_s": 0.038227237993851304,
        "sampletime": 0.9248333260184154,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 119,
        "timesteps": 23800,
        "reward_mean": 0.21450000000000016,
        "reward_max": 1.2439812500000005,
        "reward_min": -0.8807437499999999,
        "leartime_s": 0.06698550601140596,
        "sampletime": 0.9020209670125041,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 120,
        "timesteps": 24000,
        "reward_mean": 0.008525000000000211,
        "reward_max": 0.8635625,
        "reward_min": -1.03506875,
        "leartime_s": 0.0778633329900913,
        "sampletime": 0.782190605008509,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 121,
        "timesteps": 24200,
        "reward_mean": 0.020925000000000176,
        "reward_max": 0.98226875,
        "reward_min": -1.1376249999999999,
        "leartime_s": 0.03141277900431305,
        "sampletime": 0.8218001640052535,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 122,
        "timesteps": 24400,
        "reward_mean": 5.000000000014904e-05,
        "reward_max": 1.04149375,
        "reward_min": -1.3342999999999998,
        "leartime_s": 0.05994046601699665,
        "sampletime": 0.7172268319991417,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 123,
        "timesteps": 24600,
        "reward_mean": 0.15775000000000033,
        "reward_max": 1.1666750000000006,
        "reward_min": -1.3322437499999995,
        "leartime_s": 0.02167745798942633,
        "sampletime": 0.8084849350270815,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 124,
        "timesteps": 24800,
        "reward_mean": 0.09297500000000025,
        "reward_max": 0.9191562500000002,
        "reward_min": -0.9141874999999999,
        "leartime_s": 0.051366973988479,
        "sampletime": 0.9813148880202789,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 125,
        "timesteps": 25000,
        "reward_mean": -0.2651749999999997,
        "reward_max": 0.6073875000000003,
        "reward_min": -1.33551875,
        "leartime_s": 0.06860230400343426,
        "sampletime": 0.8200496589997783,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 126,
        "timesteps": 25200,
        "reward_mean": 0.14362500000000014,
        "reward_max": 1.06988125,
        "reward_min": -1.04078125,
        "leartime_s": 0.02457458499702625,
        "sampletime": 0.8563643830129877,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 127,
        "timesteps": 25400,
        "reward_mean": -0.07042499999999986,
        "reward_max": 0.8472687500000001,
        "reward_min": -1.3307687499999994,
        "leartime_s": 0.0529829110018909,
        "sampletime": 0.8816344160004519,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 128,
        "timesteps": 25600,
        "reward_mean": -0.05122499999999975,
        "reward_max": 0.8761437500000003,
        "reward_min": -1.29165625,
        "leartime_s": 0.08361461700405926,
        "sampletime": 1.0751624809927307,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 129,
        "timesteps": 25800,
        "reward_mean": 0.13745000000000027,
        "reward_max": 1.1640687500000002,
        "reward_min": -1.4510312499999996,
        "leartime_s": 0.04955440599587746,
        "sampletime": 0.8632670159859117,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 130,
        "timesteps": 26000,
        "reward_mean": 0.04480000000000012,
        "reward_max": 0.9744687500000002,
        "reward_min": -1.4013125,
        "leartime_s": 0.02039655702537857,
        "sampletime": 0.8974850419908762,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 131,
        "timesteps": 26200,
        "reward_mean": 0.10345000000000025,
        "reward_max": 0.9587250000000003,
        "reward_min": -0.8994374999999994,
        "leartime_s": 0.018414377991575748,
        "sampletime": 1.2052032130013686,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 132,
        "timesteps": 26400,
        "reward_mean": 0.2060750000000002,
        "reward_max": 1.2575187500000005,
        "reward_min": -0.9867562499999998,
        "leartime_s": 0.03038763499353081,
        "sampletime": 0.8115048239997122,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 133,
        "timesteps": 26600,
        "reward_mean": 0.30712500000000004,
        "reward_max": 1.4044937499999999,
        "reward_min": -1.1638562499999998,
        "leartime_s": 0.011744010000256822,
        "sampletime": 0.880811218987219,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 134,
        "timesteps": 26800,
        "reward_mean": 0.31092500000000023,
        "reward_max": 1.1306937500000005,
        "reward_min": -0.6276499999999997,
        "leartime_s": 0.033592177991522476,
        "sampletime": 0.9860160569951404,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 135,
        "timesteps": 27000,
        "reward_mean": 0.1708250000000003,
        "reward_max": 1.1902062500000006,
        "reward_min": -0.8683812499999998,
        "leartime_s": 0.0412844660168048,
        "sampletime": 0.9950323489902075,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 136,
        "timesteps": 27200,
        "reward_mean": 0.26515000000000016,
        "reward_max": 1.2561687500000005,
        "reward_min": -1.324625,
        "leartime_s": 0.07295525597874075,
        "sampletime": 0.7822767230099998,
        "best_mean": 0.40332500000000004,
        "best_max": 1.319175,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 137,
        "timesteps": 27400,
        "reward_mean": 0.40622500000000006,
        "reward_max": 1.2823249999999995,
        "reward_min": -0.7241749999999997,
        "leartime_s": 0.05293578500277363,
        "sampletime": 0.8828855049796402,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 138,
        "timesteps": 27600,
        "reward_mean": 0.2875500000000002,
        "reward_max": 1.32145,
        "reward_min": -1.2308499999999998,
        "leartime_s": 0.031023721996461973,
        "sampletime": 1.0084570700128097,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 139,
        "timesteps": 27800,
        "reward_mean": -0.0032749999999998405,
        "reward_max": 0.9310500000000004,
        "reward_min": -0.9389374999999999,
        "leartime_s": 0.057175259018549696,
        "sampletime": 0.845199393981602,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 140,
        "timesteps": 28000,
        "reward_mean": 0.3217750000000001,
        "reward_max": 1.36474375,
        "reward_min": -0.9953687500000001,
        "leartime_s": 0.02040173701243475,
        "sampletime": 0.8170041980047245,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 141,
        "timesteps": 28200,
        "reward_mean": 0.31325,
        "reward_max": 1.23326875,
        "reward_min": -0.68030625,
        "leartime_s": 0.034996047004824504,
        "sampletime": 0.9312878260097932,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 142,
        "timesteps": 28400,
        "reward_mean": 0.1170750000000002,
        "reward_max": 1.1799937500000004,
        "reward_min": -1.2889562500000005,
        "leartime_s": 0.05865650001214817,
        "sampletime": 0.7531270849867724,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 143,
        "timesteps": 28600,
        "reward_mean": 0.3739250000000003,
        "reward_max": 1.2354562500000001,
        "reward_min": -0.7041937499999996,
        "leartime_s": 0.04386967699974775,
        "sampletime": 0.7477744019997772,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 144,
        "timesteps": 28800,
        "reward_mean": 0.04367500000000018,
        "reward_max": 1.0311687500000002,
        "reward_min": -1.4098062499999997,
        "leartime_s": 0.028433850995497778,
        "sampletime": 1.0122386220027693,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 145,
        "timesteps": 29000,
        "reward_mean": 0.2867250000000001,
        "reward_max": 1.0378375000000002,
        "reward_min": -1.1516687499999998,
        "leartime_s": 0.021356480981921777,
        "sampletime": 0.8583533719938714,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 146,
        "timesteps": 29200,
        "reward_mean": 0.22747500000000015,
        "reward_max": 1.1513437499999999,
        "reward_min": -0.9554124999999996,
        "leartime_s": 0.03411749500082806,
        "sampletime": 0.7927401869965252,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 147,
        "timesteps": 29400,
        "reward_mean": 0.04370000000000016,
        "reward_max": 1.0930125000000002,
        "reward_min": -1.1626437499999998,
        "leartime_s": 0.026941385003738105,
        "sampletime": 0.8604779549932573,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 148,
        "timesteps": 29600,
        "reward_mean": 0.20840000000000009,
        "reward_max": 1.3550375,
        "reward_min": -0.8777187499999999,
        "leartime_s": 0.028766536997864023,
        "sampletime": 1.0489952359930612,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 149,
        "timesteps": 29800,
        "reward_mean": 0.1413500000000002,
        "reward_max": 1.1426750000000003,
        "reward_min": -1.1655249999999997,
        "leartime_s": 0.021576981991529465,
        "sampletime": 0.8038183829921763,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 150,
        "timesteps": 30000,
        "reward_mean": 0.05930000000000012,
        "reward_max": 1.2346750000000002,
        "reward_min": -1.2025312499999998,
        "leartime_s": 0.02194122297805734,
        "sampletime": 0.7792767329956405,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 151,
        "timesteps": 30200,
        "reward_mean": 0.15357500000000032,
        "reward_max": 1.1962750000000004,
        "reward_min": -1.06560625,
        "leartime_s": 0.025776160007808357,
        "sampletime": 1.025660704006441,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 152,
        "timesteps": 30400,
        "reward_mean": 0.00015000000000017443,
        "reward_max": 1.2306875,
        "reward_min": -1.1432687499999998,
        "leartime_s": 0.04744857200421393,
        "sampletime": 0.770989741984522,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 153,
        "timesteps": 30600,
        "reward_mean": 0.14435000000000003,
        "reward_max": 1.0429687500000002,
        "reward_min": -0.9823625,
        "leartime_s": 0.02948099799687043,
        "sampletime": 0.9096407130127773,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 154,
        "timesteps": 30800,
        "reward_mean": 0.17742500000000017,
        "reward_max": 1.5623937500000005,
        "reward_min": -1.0239937500000003,
        "leartime_s": 0.031857076013693586,
        "sampletime": 0.9840155059937388,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 155,
        "timesteps": 31000,
        "reward_mean": 0.006600000000000289,
        "reward_max": 1.1695499999999999,
        "reward_min": -1.1464874999999997,
        "leartime_s": 0.0419613329868298,
        "sampletime": 1.0970362100051716,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 156,
        "timesteps": 31200,
        "reward_mean": 0.25697500000000023,
        "reward_max": 1.0551312500000003,
        "reward_min": -0.8267625000000001,
        "leartime_s": 0.03486859900294803,
        "sampletime": 0.7453513159998693,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 157,
        "timesteps": 31400,
        "reward_mean": 0.2517500000000002,
        "reward_max": 1.1039000000000003,
        "reward_min": -0.9019249999999996,
        "leartime_s": 0.045330797001952305,
        "sampletime": 0.8685944720054977,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 158,
        "timesteps": 31600,
        "reward_mean": 0.17422500000000019,
        "reward_max": 1.1360250000000003,
        "reward_min": -1.0380812499999998,
        "leartime_s": 0.014942845999030396,
        "sampletime": 0.7529581839917228,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 159,
        "timesteps": 31800,
        "reward_mean": 0.32292500000000024,
        "reward_max": 1.1841812500000004,
        "reward_min": -0.6922187499999999,
        "leartime_s": 0.023411812988342717,
        "sampletime": 0.690266606019577,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 160,
        "timesteps": 32000,
        "reward_mean": 0.057250000000000335,
        "reward_max": 0.9537000000000003,
        "reward_min": -1.05419375,
        "leartime_s": 0.03841819800436497,
        "sampletime": 0.8528651210071985,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 161,
        "timesteps": 32200,
        "reward_mean": -0.013074999999999804,
        "reward_max": 0.8796375000000003,
        "reward_min": -1.1758437499999999,
        "leartime_s": 0.028602436010260135,
        "sampletime": 1.0197571619937662,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 162,
        "timesteps": 32400,
        "reward_mean": 0.09452500000000029,
        "reward_max": 0.9744125000000003,
        "reward_min": -0.9599812499999996,
        "leartime_s": 0.0408371860103216,
        "sampletime": 0.8494601779966615,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 163,
        "timesteps": 32600,
        "reward_mean": -0.031574999999999846,
        "reward_max": 0.9358062500000002,
        "reward_min": -0.9490250000000001,
        "leartime_s": 0.0467435350001324,
        "sampletime": 0.9220616040111054,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 164,
        "timesteps": 32800,
        "reward_mean": 0.01940000000000028,
        "reward_max": 1.0734250000000003,
        "reward_min": -1.3632875,
        "leartime_s": 0.048422569991089404,
        "sampletime": 0.8814576550212223,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 165,
        "timesteps": 33000,
        "reward_mean": 0.14200000000000024,
        "reward_max": 1.0539375000000002,
        "reward_min": -0.9136124999999998,
        "leartime_s": 0.09023589300340973,
        "sampletime": 0.7626773010124452,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 166,
        "timesteps": 33200,
        "reward_mean": 0.2980750000000003,
        "reward_max": 1.1738687500000005,
        "reward_min": -1.0751312499999996,
        "leartime_s": 0.019654856994748116,
        "sampletime": 0.8352647089923266,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 167,
        "timesteps": 33400,
        "reward_mean": 0.3103250000000003,
        "reward_max": 1.1963187500000003,
        "reward_min": -0.6811062499999998,
        "leartime_s": 0.0594584790233057,
        "sampletime": 0.8907613570045214,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 168,
        "timesteps": 33600,
        "reward_mean": 0.12057500000000032,
        "reward_max": 1.0232062500000003,
        "reward_min": -0.9357499999999996,
        "leartime_s": 0.08584236400201917,
        "sampletime": 0.7904813720087986,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 169,
        "timesteps": 33800,
        "reward_mean": 0.18412500000000015,
        "reward_max": 1.1846437500000002,
        "reward_min": -1.24425,
        "leartime_s": 0.038955460011493415,
        "sampletime": 0.7588230780092999,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 170,
        "timesteps": 34000,
        "reward_mean": -0.014349999999999797,
        "reward_max": 0.8246875000000002,
        "reward_min": -1.0781499999999997,
        "leartime_s": 0.013084596022963524,
        "sampletime": 0.8288914890144952,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 171,
        "timesteps": 34200,
        "reward_mean": 0.07572500000000022,
        "reward_max": 1.09724375,
        "reward_min": -1.4538562499999994,
        "leartime_s": 0.01518589400802739,
        "sampletime": 1.103162021987373,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 172,
        "timesteps": 34400,
        "reward_mean": 0.044325000000000205,
        "reward_max": 1.0032625000000002,
        "reward_min": -1.0584687499999996,
        "leartime_s": 0.027819882991025224,
        "sampletime": 0.811021934991004,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 173,
        "timesteps": 34600,
        "reward_mean": 0.3959250000000001,
        "reward_max": 1.20660625,
        "reward_min": -0.6821374999999997,
        "leartime_s": 0.019922956998925656,
        "sampletime": 0.9607028660248034,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 174,
        "timesteps": 34800,
        "reward_mean": 0.11947500000000028,
        "reward_max": 0.9682937500000005,
        "reward_min": -0.7836812499999997,
        "leartime_s": 0.020683793001808226,
        "sampletime": 0.9402404189750087,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 175,
        "timesteps": 35000,
        "reward_mean": 0.11670000000000028,
        "reward_max": 1.1301125000000003,
        "reward_min": -1.0923875,
        "leartime_s": 0.05980059300782159,
        "sampletime": 0.8599064419977367,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 176,
        "timesteps": 35200,
        "reward_mean": 0.11757500000000023,
        "reward_max": 1.1723249999999998,
        "reward_min": -1.3221812499999999,
        "leartime_s": 0.034157880989369005,
        "sampletime": 0.8297280510014389,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 177,
        "timesteps": 35400,
        "reward_mean": 0.11860000000000007,
        "reward_max": 0.8496250000000001,
        "reward_min": -1.0314750000000001,
        "leartime_s": 0.05649728898424655,
        "sampletime": 0.9125322200125083,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 178,
        "timesteps": 35600,
        "reward_mean": -0.0183499999999999,
        "reward_max": 0.7814312499999999,
        "reward_min": -1.3612125,
        "leartime_s": 0.07912875001784414,
        "sampletime": 0.7136472970014438,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 179,
        "timesteps": 35800,
        "reward_mean": 0.03850000000000018,
        "reward_max": 1.09175,
        "reward_min": -1.6594500000000005,
        "leartime_s": 0.04630886600352824,
        "sampletime": 0.7631322780216578,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 180,
        "timesteps": 36000,
        "reward_mean": 0.0029750000000001685,
        "reward_max": 1.0196125,
        "reward_min": -1.10310625,
        "leartime_s": 0.05640827797469683,
        "sampletime": 0.9144424709957093,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 181,
        "timesteps": 36200,
        "reward_mean": 0.2089250000000002,
        "reward_max": 1.4177937500000004,
        "reward_min": -1.0152312499999998,
        "leartime_s": 0.0689263140084222,
        "sampletime": 1.0282725510187447,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 182,
        "timesteps": 36400,
        "reward_mean": 0.13712500000000025,
        "reward_max": 1.2098750000000003,
        "reward_min": -0.8776187499999994,
        "leartime_s": 0.052702173008583486,
        "sampletime": 0.8241987480141688,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 183,
        "timesteps": 36600,
        "reward_mean": 0.18412500000000012,
        "reward_max": 1.02811875,
        "reward_min": -0.9994562500000002,
        "leartime_s": 0.04949042899534106,
        "sampletime": 0.7376439280051272,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 184,
        "timesteps": 36800,
        "reward_mean": 0.14492500000000014,
        "reward_max": 1.04963125,
        "reward_min": -1.2602,
        "leartime_s": 0.0360662929888349,
        "sampletime": 0.8453661770035978,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 185,
        "timesteps": 37000,
        "reward_mean": 0.26420000000000005,
        "reward_max": 1.106825,
        "reward_min": -0.6877437499999999,
        "leartime_s": 0.04695318901212886,
        "sampletime": 1.0228230110078584,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 186,
        "timesteps": 37200,
        "reward_mean": 0.08785000000000005,
        "reward_max": 0.9579749999999996,
        "reward_min": -1.0896499999999996,
        "leartime_s": 0.026157267013331875,
        "sampletime": 0.674134065018734,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 187,
        "timesteps": 37400,
        "reward_mean": 0.1728250000000001,
        "reward_max": 0.9886812500000001,
        "reward_min": -1.2119,
        "leartime_s": 0.02924333099508658,
        "sampletime": 0.7997454360011034,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 188,
        "timesteps": 37600,
        "reward_mean": 0.08537500000000015,
        "reward_max": 0.94095625,
        "reward_min": -0.9198875000000001,
        "leartime_s": 0.041807076981058344,
        "sampletime": 0.9675322569964919,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 189,
        "timesteps": 37800,
        "reward_mean": 0.03990000000000011,
        "reward_max": 0.9956,
        "reward_min": -1.1342687500000002,
        "leartime_s": 0.07383077900158241,
        "sampletime": 0.7434627239999827,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 190,
        "timesteps": 38000,
        "reward_mean": 0.08872500000000007,
        "reward_max": 1.0373687500000002,
        "reward_min": -1.01161875,
        "leartime_s": 0.03474088298389688,
        "sampletime": 0.7070433440094348,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 191,
        "timesteps": 38200,
        "reward_mean": -0.01777499999999992,
        "reward_max": 1.0212000000000003,
        "reward_min": -1.1123124999999998,
        "leartime_s": 0.04399325599661097,
        "sampletime": 0.8228405139816459,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 192,
        "timesteps": 38400,
        "reward_mean": 0.2661750000000003,
        "reward_max": 1.1254250000000003,
        "reward_min": -0.7908812499999993,
        "leartime_s": 0.0472224100085441,
        "sampletime": 1.0201965979940724,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 193,
        "timesteps": 38600,
        "reward_mean": 0.14752500000000016,
        "reward_max": 1.0467437499999999,
        "reward_min": -0.8631062499999999,
        "leartime_s": 0.0535570310021285,
        "sampletime": 0.7605920500063803,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 194,
        "timesteps": 38800,
        "reward_mean": -0.08894999999999988,
        "reward_max": 1.043125,
        "reward_min": -1.3322749999999997,
        "leartime_s": 0.031705061002867296,
        "sampletime": 0.7166408870252781,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 195,
        "timesteps": 39000,
        "reward_mean": -0.10324999999999991,
        "reward_max": 0.7192500000000001,
        "reward_min": -1.4958124999999995,
        "leartime_s": 0.034817236999515444,
        "sampletime": 0.7708261320076417,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 196,
        "timesteps": 39200,
        "reward_mean": 0.15737500000000024,
        "reward_max": 1.1146125000000002,
        "reward_min": -0.9473687499999995,
        "leartime_s": 0.013534551981138065,
        "sampletime": 0.7978135859884787,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 197,
        "timesteps": 39400,
        "reward_mean": -0.27764999999999995,
        "reward_max": 0.6097062499999998,
        "reward_min": -1.13611875,
        "leartime_s": 0.02259191099437885,
        "sampletime": 0.9296342319867108,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 198,
        "timesteps": 39600,
        "reward_mean": 0.045249999999999915,
        "reward_max": 0.9055812499999998,
        "reward_min": -1.278225,
        "leartime_s": 0.058289691020036116,
        "sampletime": 0.841711070999736,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 199,
        "timesteps": 39800,
        "reward_mean": -0.12404999999999991,
        "reward_max": 0.7223750000000001,
        "reward_min": -1.35251875,
        "leartime_s": 0.0425643110065721,
        "sampletime": 0.756114677991718,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 200,
        "timesteps": 40000,
        "reward_mean": -0.013599999999999878,
        "reward_max": 0.9056687500000002,
        "reward_min": -1.2175437500000001,
        "leartime_s": 0.024472110002534464,
        "sampletime": 0.8593829479941633,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 201,
        "timesteps": 40200,
        "reward_mean": 0.3408750000000002,
        "reward_max": 1.29141875,
        "reward_min": -0.8292687499999999,
        "leartime_s": 0.039677586988545954,
        "sampletime": 0.957260152004892,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 202,
        "timesteps": 40400,
        "reward_mean": -0.29645000000000005,
        "reward_max": 0.5997125,
        "reward_min": -1.4838750000000003,
        "leartime_s": 0.027478182018967345,
        "sampletime": 0.7890942389785778,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 203,
        "timesteps": 40600,
        "reward_mean": 0.00015000000000006962,
        "reward_max": 0.9337562499999998,
        "reward_min": -1.3816437499999998,
        "leartime_s": 0.03373046999331564,
        "sampletime": 0.8600820300052874,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 204,
        "timesteps": 40800,
        "reward_mean": -0.13612499999999986,
        "reward_max": 0.8463875000000003,
        "reward_min": -1.8644374999999989,
        "leartime_s": 0.07315979097620584,
        "sampletime": 1.0237889529962558,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 205,
        "timesteps": 41000,
        "reward_mean": 0.09390000000000011,
        "reward_max": 0.8082312500000003,
        "reward_min": -1.0005937499999995,
        "leartime_s": 0.07891414698679,
        "sampletime": 0.811289086996112,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 206,
        "timesteps": 41200,
        "reward_mean": -0.06232499999999983,
        "reward_max": 0.924225,
        "reward_min": -1.1974812499999998,
        "leartime_s": 0.019098625984042883,
        "sampletime": 0.8189066549821291,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 207,
        "timesteps": 41400,
        "reward_mean": 0.07922499999999993,
        "reward_max": 0.9066437499999999,
        "reward_min": -1.3376250000000005,
        "leartime_s": 0.015505480987485498,
        "sampletime": 0.9165946200082544,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 208,
        "timesteps": 41600,
        "reward_mean": 0.12230000000000017,
        "reward_max": 0.9767562500000004,
        "reward_min": -0.9575874999999996,
        "leartime_s": 0.04264136200072244,
        "sampletime": 1.0456268989946693,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 209,
        "timesteps": 41800,
        "reward_mean": -0.006950000000000032,
        "reward_max": 0.8858125,
        "reward_min": -1.1269375000000004,
        "leartime_s": 0.050526558014098555,
        "sampletime": 0.7423554480192252,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 210,
        "timesteps": 42000,
        "reward_mean": -0.16409999999999997,
        "reward_max": 0.7173687499999999,
        "reward_min": -1.269475,
        "leartime_s": 0.01829622298828326,
        "sampletime": 0.8879735230002552,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 211,
        "timesteps": 42200,
        "reward_mean": -0.16904999999999978,
        "reward_max": 0.8629500000000002,
        "reward_min": -1.45075,
        "leartime_s": 0.07401491500786506,
        "sampletime": 1.023572261998197,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 212,
        "timesteps": 42400,
        "reward_mean": -0.33770000000000006,
        "reward_max": 0.5114874999999998,
        "reward_min": -1.5590124999999997,
        "leartime_s": 0.05585174498264678,
        "sampletime": 0.9647061189753003,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 213,
        "timesteps": 42600,
        "reward_mean": 0.03652500000000012,
        "reward_max": 1.0089937500000001,
        "reward_min": -1.1656187499999997,
        "leartime_s": 0.06253097401349805,
        "sampletime": 0.7895700939989183,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 214,
        "timesteps": 42800,
        "reward_mean": -0.12242499999999991,
        "reward_max": 0.8582062499999998,
        "reward_min": -1.4446125,
        "leartime_s": 0.03148671501548961,
        "sampletime": 0.96055369800888,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 215,
        "timesteps": 43000,
        "reward_mean": -0.17917499999999995,
        "reward_max": 0.7570375000000001,
        "reward_min": -1.3258625,
        "leartime_s": 0.020380803005537018,
        "sampletime": 0.9309798869944643,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 216,
        "timesteps": 43200,
        "reward_mean": 0.055700000000000104,
        "reward_max": 1.0471062500000003,
        "reward_min": -1.0782125000000002,
        "leartime_s": 0.04948168498231098,
        "sampletime": 0.876853863010183,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 217,
        "timesteps": 43400,
        "reward_mean": -0.20182499999999998,
        "reward_max": 0.6475187500000001,
        "reward_min": -1.46276875,
        "leartime_s": 0.040715497016208246,
        "sampletime": 0.8167036840168294,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 218,
        "timesteps": 43600,
        "reward_mean": -0.11412499999999978,
        "reward_max": 0.989325,
        "reward_min": -1.0086124999999997,
        "leartime_s": 0.023993148002773523,
        "sampletime": 1.0843443209887482,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 219,
        "timesteps": 43800,
        "reward_mean": -0.22574999999999978,
        "reward_max": 0.7020625000000003,
        "reward_min": -1.3210875000000002,
        "leartime_s": 0.03259422900737263,
        "sampletime": 0.8050124550063629,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 220,
        "timesteps": 44000,
        "reward_mean": -0.11709999999999995,
        "reward_max": 0.7957875,
        "reward_min": -1.3353187499999999,
        "leartime_s": 0.049889668996911496,
        "sampletime": 0.8017590630042832,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 221,
        "timesteps": 44200,
        "reward_mean": 0.03967500000000016,
        "reward_max": 1.04055,
        "reward_min": -1.08650625,
        "leartime_s": 0.06448786798864603,
        "sampletime": 1.0330519379931502,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 222,
        "timesteps": 44400,
        "reward_mean": 0.05035000000000011,
        "reward_max": 0.9255187500000002,
        "reward_min": -1.1814562499999997,
        "leartime_s": 0.09787679798319004,
        "sampletime": 0.978116260987008,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 223,
        "timesteps": 44600,
        "reward_mean": -0.05197499999999993,
        "reward_max": 1.0453312499999998,
        "reward_min": -1.3097437499999998,
        "leartime_s": 0.031020471011288464,
        "sampletime": 0.8471721449750476,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 224,
        "timesteps": 44800,
        "reward_mean": -0.021275000000000002,
        "reward_max": 1.0150812500000002,
        "reward_min": -1.34146875,
        "leartime_s": 0.07457843198790215,
        "sampletime": 0.8565241289907135,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 225,
        "timesteps": 45000,
        "reward_mean": -0.30545000000000005,
        "reward_max": 0.48065625,
        "reward_min": -1.4962187500000004,
        "leartime_s": 0.06661790798534639,
        "sampletime": 1.0260690819995943,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 226,
        "timesteps": 45200,
        "reward_mean": -0.019849999999999913,
        "reward_max": 0.906375,
        "reward_min": -1.0884125000000002,
        "leartime_s": 0.044432994996896014,
        "sampletime": 0.8262097599799745,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 227,
        "timesteps": 45400,
        "reward_mean": -0.08369999999999995,
        "reward_max": 0.8315812499999997,
        "reward_min": -1.3771000000000002,
        "leartime_s": 0.01668353399145417,
        "sampletime": 0.7699258630163968,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 228,
        "timesteps": 45600,
        "reward_mean": -0.13994999999999988,
        "reward_max": 0.7045187500000003,
        "reward_min": -1.5493750000000002,
        "leartime_s": 0.036606389010557905,
        "sampletime": 0.9567661740002222,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 229,
        "timesteps": 45800,
        "reward_mean": -0.25547499999999995,
        "reward_max": 0.6637812500000001,
        "reward_min": -1.3387937500000002,
        "leartime_s": 0.05709925401606597,
        "sampletime": 0.9602537250029854,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 230,
        "timesteps": 46000,
        "reward_mean": -0.18135000000000007,
        "reward_max": 0.7033874999999998,
        "reward_min": -1.2399625,
        "leartime_s": 0.03385957897990011,
        "sampletime": 0.8108489269798156,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 231,
        "timesteps": 46200,
        "reward_mean": -0.013524999999999952,
        "reward_max": 0.7131437499999999,
        "reward_min": -1.147275,
        "leartime_s": 0.013680064002983272,
        "sampletime": 0.9367723840114195,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 232,
        "timesteps": 46400,
        "reward_mean": -0.30820000000000003,
        "reward_max": 0.5329312499999999,
        "reward_min": -1.5438437500000002,
        "leartime_s": 0.03288043400971219,
        "sampletime": 0.6625372580019757,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 233,
        "timesteps": 46600,
        "reward_mean": -0.22139999999999976,
        "reward_max": 0.89768125,
        "reward_min": -1.1804124999999996,
        "leartime_s": 0.03000039601465687,
        "sampletime": 0.7772850230103359,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 234,
        "timesteps": 46800,
        "reward_mean": -0.040524999999999874,
        "reward_max": 0.9889625000000002,
        "reward_min": -1.22950625,
        "leartime_s": 0.05104234899044968,
        "sampletime": 0.7540894679841585,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 235,
        "timesteps": 47000,
        "reward_mean": -0.12430000000000008,
        "reward_max": 0.7091124999999999,
        "reward_min": -1.1011812500000004,
        "leartime_s": 0.05554781699902378,
        "sampletime": 0.9405962940072641,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 236,
        "timesteps": 47200,
        "reward_mean": 0.12940000000000013,
        "reward_max": 0.9021625,
        "reward_min": -0.8302624999999999,
        "leartime_s": 0.0372178950055968,
        "sampletime": 0.7685761599859688,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 237,
        "timesteps": 47400,
        "reward_mean": 0.1495500000000001,
        "reward_max": 0.8173687500000002,
        "reward_min": -0.8730812499999998,
        "leartime_s": 0.03737793199252337,
        "sampletime": 0.7430427040089853,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 238,
        "timesteps": 47600,
        "reward_mean": -0.017475000000000088,
        "reward_max": 1.0898,
        "reward_min": -1.5470312499999999,
        "leartime_s": 0.03334005700889975,
        "sampletime": 1.0484618360060267,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 239,
        "timesteps": 47800,
        "reward_mean": -0.28777500000000006,
        "reward_max": 0.7401999999999997,
        "reward_min": -1.4629500000000002,
        "leartime_s": 0.019657402008306235,
        "sampletime": 0.9227783990208991,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 240,
        "timesteps": 48000,
        "reward_mean": -0.21497500000000003,
        "reward_max": 0.6321812499999999,
        "reward_min": -1.3204312500000004,
        "leartime_s": 0.03702113899635151,
        "sampletime": 0.7036329930124339,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 241,
        "timesteps": 48200,
        "reward_mean": -0.1802750000000001,
        "reward_max": 0.9711437500000001,
        "reward_min": -1.3395687500000006,
        "leartime_s": 0.03674857798614539,
        "sampletime": 0.9480589620070532,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 242,
        "timesteps": 48400,
        "reward_mean": -0.24722500000000006,
        "reward_max": 0.9301124999999998,
        "reward_min": -1.3687937500000007,
        "leartime_s": 0.07490321202203631,
        "sampletime": 1.0466021450120024,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 243,
        "timesteps": 48600,
        "reward_mean": -0.18572499999999992,
        "reward_max": 0.9386187500000005,
        "reward_min": -1.4920874999999996,
        "leartime_s": 0.07967512402683496,
        "sampletime": 0.8938014260202181,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 244,
        "timesteps": 48800,
        "reward_mean": -0.15132499999999993,
        "reward_max": 0.9194375000000001,
        "reward_min": -1.3236750000000004,
        "leartime_s": 0.031665418995544314,
        "sampletime": 0.770130719000008,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 245,
        "timesteps": 49000,
        "reward_mean": -0.004699999999999933,
        "reward_max": 1.051475,
        "reward_min": -1.1126624999999999,
        "leartime_s": 0.01737295198836364,
        "sampletime": 1.022040242998628,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 246,
        "timesteps": 49200,
        "reward_mean": -0.22342499999999998,
        "reward_max": 0.70508125,
        "reward_min": -1.3595125000000003,
        "leartime_s": 0.041870426008244976,
        "sampletime": 0.7770724709844217,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 247,
        "timesteps": 49400,
        "reward_mean": -0.10922499999999992,
        "reward_max": 0.8883312500000001,
        "reward_min": -1.3321937499999996,
        "leartime_s": 0.07168143702438101,
        "sampletime": 0.870200257981196,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 248,
        "timesteps": 49600,
        "reward_mean": 0.050300000000000046,
        "reward_max": 0.7637,
        "reward_min": -1.1076499999999996,
        "leartime_s": 0.07270653199520893,
        "sampletime": 0.9984234949806705,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 249,
        "timesteps": 49800,
        "reward_mean": -0.27157500000000007,
        "reward_max": 0.5886250000000001,
        "reward_min": -1.50995,
        "leartime_s": 0.0313509670086205,
        "sampletime": 0.7357851999986451,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 250,
        "timesteps": 50000,
        "reward_mean": -0.35700000000000004,
        "reward_max": 0.6405937500000001,
        "reward_min": -1.7041062500000002,
        "leartime_s": 0.03930829500313848,
        "sampletime": 0.8267619230027776,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 251,
        "timesteps": 50200,
        "reward_mean": -0.0016249999999998562,
        "reward_max": 0.9542750000000003,
        "reward_min": -1.04405625,
        "leartime_s": 0.07379618700360879,
        "sampletime": 0.9645419989828952,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 252,
        "timesteps": 50400,
        "reward_mean": -0.21129999999999985,
        "reward_max": 0.7176062500000002,
        "reward_min": -1.3418875000000001,
        "leartime_s": 0.05194977400242351,
        "sampletime": 0.7692053570062853,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 253,
        "timesteps": 50600,
        "reward_mean": -0.291375,
        "reward_max": 0.6726312499999997,
        "reward_min": -1.5811375000000003,
        "leartime_s": 0.023896727012470365,
        "sampletime": 0.7960573979944456,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 254,
        "timesteps": 50800,
        "reward_mean": -0.17867499999999994,
        "reward_max": 0.9786124999999999,
        "reward_min": -2.22945625,
        "leartime_s": 0.017104430007748306,
        "sampletime": 0.9893151340074837,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 255,
        "timesteps": 51000,
        "reward_mean": -0.19402499999999992,
        "reward_max": 0.9835562500000001,
        "reward_min": -1.7835062499999998,
        "leartime_s": 0.0644304429879412,
        "sampletime": 0.8109511059883516,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 256,
        "timesteps": 51200,
        "reward_mean": -0.24642499999999998,
        "reward_max": 0.84005,
        "reward_min": -1.5753999999999997,
        "leartime_s": 0.06270456599304453,
        "sampletime": 0.8116947130183689,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 257,
        "timesteps": 51400,
        "reward_mean": -0.20127499999999982,
        "reward_max": 0.8089437500000003,
        "reward_min": -1.5066312499999999,
        "leartime_s": 0.08027592199505307,
        "sampletime": 0.9989348179951776,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 258,
        "timesteps": 51600,
        "reward_mean": -0.16239999999999996,
        "reward_max": 0.85558125,
        "reward_min": -1.37614375,
        "leartime_s": 0.061458242998924106,
        "sampletime": 0.9340430280135479,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 259,
        "timesteps": 51800,
        "reward_mean": -0.21045000000000014,
        "reward_max": 0.7392874999999999,
        "reward_min": -1.4329375000000002,
        "leartime_s": 0.039630266022868454,
        "sampletime": 0.8382990180107299,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 260,
        "timesteps": 52000,
        "reward_mean": -0.160825,
        "reward_max": 0.8383812499999997,
        "reward_min": -1.4849999999999997,
        "leartime_s": 0.022974267980316654,
        "sampletime": 0.9405464379815385,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 261,
        "timesteps": 52200,
        "reward_mean": -0.372475,
        "reward_max": 0.7004187500000002,
        "reward_min": -2.0296687500000004,
        "leartime_s": 0.08200830899295397,
        "sampletime": 0.9190519369731192,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 262,
        "timesteps": 52400,
        "reward_mean": -0.015400000000000077,
        "reward_max": 0.9187124999999998,
        "reward_min": -1.14509375,
        "leartime_s": 0.022488855000119656,
        "sampletime": 0.7606873380136676,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 263,
        "timesteps": 52600,
        "reward_mean": -0.4289249999999999,
        "reward_max": 0.5012062500000001,
        "reward_min": -1.6896,
        "leartime_s": 0.04750129801686853,
        "sampletime": 0.7588853540073615,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 264,
        "timesteps": 52800,
        "reward_mean": -0.49330000000000007,
        "reward_max": 0.3694124999999999,
        "reward_min": -1.9868125000000003,
        "leartime_s": 0.03424510100740008,
        "sampletime": 1.0959872690145858,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 265,
        "timesteps": 53000,
        "reward_mean": -0.2605250000000001,
        "reward_max": 0.8349812500000002,
        "reward_min": -1.7187625,
        "leartime_s": 0.0805911630159244,
        "sampletime": 0.8489893170190044,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 266,
        "timesteps": 53200,
        "reward_mean": -0.25879999999999986,
        "reward_max": 0.8849937500000001,
        "reward_min": -1.5495062499999999,
        "leartime_s": 0.052897431974997744,
        "sampletime": 0.8150916210142896,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 267,
        "timesteps": 53400,
        "reward_mean": -0.25044999999999984,
        "reward_max": 0.6337625000000001,
        "reward_min": -1.7380624999999996,
        "leartime_s": 0.054772081988630816,
        "sampletime": 0.7661718270101119,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 268,
        "timesteps": 53600,
        "reward_mean": -0.43494999999999995,
        "reward_max": 0.5437500000000001,
        "reward_min": -1.5741500000000004,
        "leartime_s": 0.05124302499461919,
        "sampletime": 0.7805184189928696,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 269,
        "timesteps": 53800,
        "reward_mean": -0.14764999999999986,
        "reward_max": 0.783775,
        "reward_min": -1.4571499999999993,
        "leartime_s": 0.024063057004241273,
        "sampletime": 0.7526768990210257,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 270,
        "timesteps": 54000,
        "reward_mean": -0.1728500000000001,
        "reward_max": 0.9678249999999995,
        "reward_min": -1.3414875000000002,
        "leartime_s": 0.059878335014218464,
        "sampletime": 0.9169576979766134,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 271,
        "timesteps": 54200,
        "reward_mean": -0.24312499999999995,
        "reward_max": 0.9221250000000003,
        "reward_min": -1.2988937500000004,
        "leartime_s": 0.05451313001685776,
        "sampletime": 0.7447579200088512,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 272,
        "timesteps": 54400,
        "reward_mean": -0.455,
        "reward_max": 0.6269375,
        "reward_min": -1.9406062499999999,
        "leartime_s": 0.0586592800100334,
        "sampletime": 0.7934109620109666,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 273,
        "timesteps": 54600,
        "reward_mean": 0.10747500000000017,
        "reward_max": 0.9646125,
        "reward_min": -0.9755499999999996,
        "leartime_s": 0.08664323200355284,
        "sampletime": 0.9902421190054156,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 274,
        "timesteps": 54800,
        "reward_mean": -0.18957499999999994,
        "reward_max": 0.9400312500000001,
        "reward_min": -1.1848937499999994,
        "leartime_s": 0.08824265300063416,
        "sampletime": 0.7684197900234722,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 275,
        "timesteps": 55000,
        "reward_mean": -0.060424999999999854,
        "reward_max": 0.90478125,
        "reward_min": -1.3325874999999998,
        "leartime_s": 0.07425975298974663,
        "sampletime": 0.7694065460236743,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 276,
        "timesteps": 55200,
        "reward_mean": -0.05224999999999986,
        "reward_max": 0.9975312499999996,
        "reward_min": -1.9570374999999998,
        "leartime_s": 0.07227850699564442,
        "sampletime": 0.9170239270024467,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 277,
        "timesteps": 55400,
        "reward_mean": -0.10492499999999998,
        "reward_max": 0.8081562500000002,
        "reward_min": -1.41405,
        "leartime_s": 0.07416001500678249,
        "sampletime": 0.8323412629833911,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 278,
        "timesteps": 55600,
        "reward_mean": -0.03164999999999992,
        "reward_max": 0.8879750000000001,
        "reward_min": -1.1800375,
        "leartime_s": 0.033483342005638406,
        "sampletime": 0.8632697069842834,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 279,
        "timesteps": 55800,
        "reward_mean": -0.2489499999999999,
        "reward_max": 0.6841499999999999,
        "reward_min": -1.2713499999999998,
        "leartime_s": 0.05178529798286036,
        "sampletime": 0.9465904499811586,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 280,
        "timesteps": 56000,
        "reward_mean": -0.14052499999999998,
        "reward_max": 0.7957562499999999,
        "reward_min": -1.4583437499999996,
        "leartime_s": 0.08866451701032929,
        "sampletime": 0.9314717989764176,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 281,
        "timesteps": 56200,
        "reward_mean": -0.1462999999999998,
        "reward_max": 0.6107812500000003,
        "reward_min": -1.4464062499999994,
        "leartime_s": 0.040695698000490665,
        "sampletime": 0.8613573449838441,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 282,
        "timesteps": 56400,
        "reward_mean": -0.32152499999999995,
        "reward_max": 0.7925562500000001,
        "reward_min": -1.9077749999999998,
        "leartime_s": 0.06664184900000691,
        "sampletime": 0.7734247950138524,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 283,
        "timesteps": 56600,
        "reward_mean": -0.2792249999999999,
        "reward_max": 0.65671875,
        "reward_min": -1.9162374999999994,
        "leartime_s": 0.057351867988472804,
        "sampletime": 0.9843796170025598,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 284,
        "timesteps": 56800,
        "reward_mean": -0.5528,
        "reward_max": 0.5250750000000001,
        "reward_min": -1.6115374999999998,
        "leartime_s": 0.08357110197539441,
        "sampletime": 0.7773032679979224,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 285,
        "timesteps": 57000,
        "reward_mean": -0.04855,
        "reward_max": 0.9202875000000003,
        "reward_min": -1.5969374999999992,
        "leartime_s": 0.03369034398929216,
        "sampletime": 0.8956877839809749,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 286,
        "timesteps": 57200,
        "reward_mean": -0.4224249999999999,
        "reward_max": 0.5642812500000002,
        "reward_min": -1.66399375,
        "leartime_s": 0.07917180098593235,
        "sampletime": 0.9719631870102603,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 287,
        "timesteps": 57400,
        "reward_mean": -0.5363499999999999,
        "reward_max": 0.54448125,
        "reward_min": -2.2183375000000005,
        "leartime_s": 0.08035672100959346,
        "sampletime": 0.9320673160254955,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 288,
        "timesteps": 57600,
        "reward_mean": -0.300525,
        "reward_max": 0.7091624999999998,
        "reward_min": -1.5436625000000004,
        "leartime_s": 0.0739956560137216,
        "sampletime": 0.6988676940090954,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 289,
        "timesteps": 57800,
        "reward_mean": -0.3131499999999999,
        "reward_max": 0.4540000000000003,
        "reward_min": -1.8747499999999997,
        "leartime_s": 0.0379161529999692,
        "sampletime": 0.7958771919948049,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 290,
        "timesteps": 58000,
        "reward_mean": -0.341225,
        "reward_max": 0.8685687499999999,
        "reward_min": -1.68930625,
        "leartime_s": 0.07060342500335537,
        "sampletime": 0.9916388730052859,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 291,
        "timesteps": 58200,
        "reward_mean": -0.4232499999999996,
        "reward_max": 0.4885812500000004,
        "reward_min": -1.4915124999999996,
        "leartime_s": 0.07640802199603058,
        "sampletime": 0.8279840860050172,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 292,
        "timesteps": 58400,
        "reward_mean": -0.38772499999999993,
        "reward_max": 0.5393125000000002,
        "reward_min": -1.5372687499999995,
        "leartime_s": 0.03000295499805361,
        "sampletime": 0.8038416910276283,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 293,
        "timesteps": 58600,
        "reward_mean": -0.352825,
        "reward_max": 0.6995812499999999,
        "reward_min": -1.7462187500000004,
        "leartime_s": 0.028589867986738682,
        "sampletime": 1.0150465510087088,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 294,
        "timesteps": 58800,
        "reward_mean": -0.22607499999999983,
        "reward_max": 0.7921062500000003,
        "reward_min": -1.3410624999999992,
        "leartime_s": 0.07083981100004166,
        "sampletime": 0.7874983979854733,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 295,
        "timesteps": 59000,
        "reward_mean": -0.1309499999999999,
        "reward_max": 0.5380124999999999,
        "reward_min": -1.1748124999999994,
        "leartime_s": 0.0410618009918835,
        "sampletime": 0.7749110170116182,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 296,
        "timesteps": 59200,
        "reward_mean": -0.37127499999999997,
        "reward_max": 0.48903750000000024,
        "reward_min": -1.4424812500000002,
        "leartime_s": 0.04896595899481326,
        "sampletime": 0.8812923589721322,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 297,
        "timesteps": 59400,
        "reward_mean": -0.5701249999999999,
        "reward_max": 0.5040375,
        "reward_min": -2.0723562500000003,
        "leartime_s": 0.05204669400700368,
        "sampletime": 1.104027927009156,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 298,
        "timesteps": 59600,
        "reward_mean": -0.4026249999999999,
        "reward_max": 0.5431312500000002,
        "reward_min": -2.1508499999999997,
        "leartime_s": 0.08003137100604363,
        "sampletime": 0.848581896018004,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 299,
        "timesteps": 59800,
        "reward_mean": -0.26724999999999965,
        "reward_max": 0.6848875000000004,
        "reward_min": -1.3796812499999997,
        "leartime_s": 0.018068169010803103,
        "sampletime": 0.8633063790039159,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 300,
        "timesteps": 60000,
        "reward_mean": -0.6779749999999999,
        "reward_max": 0.5353125000000002,
        "reward_min": -1.9314749999999998,
        "leartime_s": 0.06468464701902121,
        "sampletime": 0.8986471380048897,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 301,
        "timesteps": 60200,
        "reward_mean": -0.6869499999999998,
        "reward_max": 0.16102499999999995,
        "reward_min": -1.8598375000000003,
        "leartime_s": 0.03801070398185402,
        "sampletime": 0.8606030849914532,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 302,
        "timesteps": 60400,
        "reward_mean": -0.5144499999999999,
        "reward_max": 0.5470687500000002,
        "reward_min": -1.9120812499999997,
        "leartime_s": 0.03159786298056133,
        "sampletime": 0.8979496789979748,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 303,
        "timesteps": 60600,
        "reward_mean": -0.42379999999999973,
        "reward_max": 0.5145937500000001,
        "reward_min": -1.809299999999999,
        "leartime_s": 0.0706312750116922,
        "sampletime": 0.7412604079872835,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 304,
        "timesteps": 60800,
        "reward_mean": -0.3458499999999999,
        "reward_max": 0.7428687500000003,
        "reward_min": -1.7083249999999999,
        "leartime_s": 0.02890746999764815,
        "sampletime": 0.8088291200110689,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 305,
        "timesteps": 61000,
        "reward_mean": -0.43089999999999967,
        "reward_max": 0.5121125000000003,
        "reward_min": -2.0571624999999996,
        "leartime_s": 0.05346966200158931,
        "sampletime": 0.7302986449794844,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 306,
        "timesteps": 61200,
        "reward_mean": -0.49322499999999986,
        "reward_max": 0.36405625000000014,
        "reward_min": -1.5651499999999998,
        "leartime_s": 0.08583952399203554,
        "sampletime": 0.8142588689806871,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 307,
        "timesteps": 61400,
        "reward_mean": -0.49862499999999976,
        "reward_max": 0.27356250000000015,
        "reward_min": -1.7183812499999993,
        "leartime_s": 0.07864084601169452,
        "sampletime": 0.8229409549967386,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 308,
        "timesteps": 61600,
        "reward_mean": -0.1938249999999998,
        "reward_max": 0.7209625,
        "reward_min": -1.3659625000000004,
        "leartime_s": 0.045591595000587404,
        "sampletime": 0.7117841339786537,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 309,
        "timesteps": 61800,
        "reward_mean": -0.6379999999999998,
        "reward_max": 0.25986250000000005,
        "reward_min": -1.8675125000000001,
        "leartime_s": 0.05061841700808145,
        "sampletime": 1.015792649006471,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 310,
        "timesteps": 62000,
        "reward_mean": -0.6612999999999999,
        "reward_max": 0.560225,
        "reward_min": -1.8439250000000005,
        "leartime_s": 0.06386487500276417,
        "sampletime": 0.7789166769944131,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 311,
        "timesteps": 62200,
        "reward_mean": -0.47254999999999975,
        "reward_max": 0.4916437500000002,
        "reward_min": -1.6329624999999999,
        "leartime_s": 0.0697013039898593,
        "sampletime": 0.8598398180038203,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 312,
        "timesteps": 62400,
        "reward_mean": -0.38779999999999987,
        "reward_max": 0.515175,
        "reward_min": -1.4074812500000005,
        "leartime_s": 0.0776788409857545,
        "sampletime": 0.8993393249984365,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 313,
        "timesteps": 62600,
        "reward_mean": -0.3312999999999998,
        "reward_max": 0.612675,
        "reward_min": -1.3895125,
        "leartime_s": 0.04346172302030027,
        "sampletime": 0.7951234270003624,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 314,
        "timesteps": 62800,
        "reward_mean": -0.5865499999999997,
        "reward_max": 0.2991125000000002,
        "reward_min": -1.7622812500000002,
        "leartime_s": 0.022596140974201262,
        "sampletime": 0.8352533449942712,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 315,
        "timesteps": 63000,
        "reward_mean": -0.3931999999999997,
        "reward_max": 0.5532687500000004,
        "reward_min": -1.68954375,
        "leartime_s": 0.03428774999338202,
        "sampletime": 0.9379857660096604,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 316,
        "timesteps": 63200,
        "reward_mean": -0.4412749999999998,
        "reward_max": 0.507975,
        "reward_min": -1.7492437499999993,
        "leartime_s": 0.08289150000200607,
        "sampletime": 0.7297707190155052,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 317,
        "timesteps": 63400,
        "reward_mean": -0.43129999999999963,
        "reward_max": 0.5932437500000004,
        "reward_min": -1.7690624999999993,
        "leartime_s": 0.03829537102137692,
        "sampletime": 0.8115740259818267,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 318,
        "timesteps": 63600,
        "reward_mean": -0.5013999999999998,
        "reward_max": 0.4972375000000003,
        "reward_min": -1.6460624999999998,
        "leartime_s": 0.07382141400012188,
        "sampletime": 0.8283812640001997,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 319,
        "timesteps": 63800,
        "reward_mean": -0.40564999999999984,
        "reward_max": 0.6032000000000002,
        "reward_min": -1.5756875,
        "leartime_s": 0.07727542298380286,
        "sampletime": 0.9376547349966131,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 320,
        "timesteps": 64000,
        "reward_mean": -0.5324999999999999,
        "reward_max": 0.34850000000000014,
        "reward_min": -1.6590624999999994,
        "leartime_s": 0.0403408000129275,
        "sampletime": 0.744999212998664,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 321,
        "timesteps": 64200,
        "reward_mean": -0.33122499999999977,
        "reward_max": 0.5664750000000001,
        "reward_min": -1.489975,
        "leartime_s": 0.029327205993467942,
        "sampletime": 0.7952544279978611,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 322,
        "timesteps": 64400,
        "reward_mean": -0.6556749999999997,
        "reward_max": 0.36791875000000024,
        "reward_min": -1.7716812499999992,
        "leartime_s": 0.05759034398943186,
        "sampletime": 0.8594970379781444,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 323,
        "timesteps": 64600,
        "reward_mean": -0.705325,
        "reward_max": 0.33762500000000006,
        "reward_min": -2.47098125,
        "leartime_s": 0.05857719198684208,
        "sampletime": 1.0417868829972576,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 324,
        "timesteps": 64800,
        "reward_mean": -0.4154749999999998,
        "reward_max": 0.5020875000000004,
        "reward_min": -1.5612812500000002,
        "leartime_s": 0.039702195004792884,
        "sampletime": 0.8196366699994542,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 325,
        "timesteps": 65000,
        "reward_mean": -0.517975,
        "reward_max": 0.6169812500000001,
        "reward_min": -2.0132875,
        "leartime_s": 0.04627679902478121,
        "sampletime": 0.941779744985979,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 326,
        "timesteps": 65200,
        "reward_mean": -0.5742999999999997,
        "reward_max": 0.4788625000000001,
        "reward_min": -2.2083999999999997,
        "leartime_s": 0.11483694799244404,
        "sampletime": 0.8059650039940607,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 327,
        "timesteps": 65400,
        "reward_mean": -0.5699499999999998,
        "reward_max": 0.34731250000000014,
        "reward_min": -1.6181374999999998,
        "leartime_s": 0.08925291599007323,
        "sampletime": 0.8409783900133334,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 328,
        "timesteps": 65600,
        "reward_mean": -0.8363999999999998,
        "reward_max": 0.07865000000000016,
        "reward_min": -2.2556499999999997,
        "leartime_s": 0.029653986974153668,
        "sampletime": 0.9007758089865092,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 329,
        "timesteps": 65800,
        "reward_mean": -0.46404999999999996,
        "reward_max": 0.3509500000000001,
        "reward_min": -1.6981312500000003,
        "leartime_s": 0.03332125599263236,
        "sampletime": 0.7489314489939716,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 330,
        "timesteps": 66000,
        "reward_mean": -0.7180749999999997,
        "reward_max": 0.28258125000000034,
        "reward_min": -2.126537499999999,
        "leartime_s": 0.07657673000358045,
        "sampletime": 0.7794323319976684,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 331,
        "timesteps": 66200,
        "reward_mean": -0.719875,
        "reward_max": 0.2742875,
        "reward_min": -2.22815,
        "leartime_s": 0.04247043302166276,
        "sampletime": 0.8679103330068756,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 332,
        "timesteps": 66400,
        "reward_mean": -0.6632249999999997,
        "reward_max": 0.3194187500000003,
        "reward_min": -2.3955562500000003,
        "leartime_s": 0.052992343000369146,
        "sampletime": 1.1181786080123857,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 333,
        "timesteps": 66600,
        "reward_mean": -0.5692999999999999,
        "reward_max": 0.3837125,
        "reward_min": -1.780725,
        "leartime_s": 0.06658438299200498,
        "sampletime": 0.9848169239994604,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 334,
        "timesteps": 66800,
        "reward_mean": -0.4458,
        "reward_max": 0.3964750000000001,
        "reward_min": -1.4100437499999996,
        "leartime_s": 0.03382963998592459,
        "sampletime": 0.780102426011581,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 335,
        "timesteps": 67000,
        "reward_mean": -0.4412249999999999,
        "reward_max": 0.4953937499999999,
        "reward_min": -1.59836875,
        "leartime_s": 0.05029829099657945,
        "sampletime": 0.901111564016901,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 336,
        "timesteps": 67200,
        "reward_mean": -0.3607999999999997,
        "reward_max": 0.4942625000000004,
        "reward_min": -1.7000749999999998,
        "leartime_s": 0.06543336599133909,
        "sampletime": 0.7478200499899685,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 337,
        "timesteps": 67400,
        "reward_mean": -0.549225,
        "reward_max": 0.4469937500000002,
        "reward_min": -1.5058812500000003,
        "leartime_s": 0.0576910300005693,
        "sampletime": 0.77926517999731,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 338,
        "timesteps": 67600,
        "reward_mean": -0.47027499999999983,
        "reward_max": 0.4009625000000001,
        "reward_min": -1.5407437499999996,
        "leartime_s": 0.07709875301225111,
        "sampletime": 0.7112262120062951,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 339,
        "timesteps": 67800,
        "reward_mean": -0.509875,
        "reward_max": 0.6046875,
        "reward_min": -1.6504749999999995,
        "leartime_s": 0.05378398799803108,
        "sampletime": 0.8266803230217192,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 340,
        "timesteps": 68000,
        "reward_mean": -0.40792499999999987,
        "reward_max": 0.4051687500000001,
        "reward_min": -1.34748125,
        "leartime_s": 0.03778425802011043,
        "sampletime": 0.8233281679858919,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 341,
        "timesteps": 68200,
        "reward_mean": -0.7910249999999999,
        "reward_max": 0.28247500000000003,
        "reward_min": -2.29605625,
        "leartime_s": 0.04308233701158315,
        "sampletime": 0.9136647200211883,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 342,
        "timesteps": 68400,
        "reward_mean": -0.6378499999999999,
        "reward_max": 0.5224125000000002,
        "reward_min": -2.0978125,
        "leartime_s": 0.08774507199996151,
        "sampletime": 0.828849841025658,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 343,
        "timesteps": 68600,
        "reward_mean": -0.6451500000000002,
        "reward_max": 0.4495125,
        "reward_min": -1.74911875,
        "leartime_s": 0.04934939602389932,
        "sampletime": 0.8630884560116101,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 344,
        "timesteps": 68800,
        "reward_mean": -0.81225,
        "reward_max": 0.14829999999999982,
        "reward_min": -2.1111187500000006,
        "leartime_s": 0.05418348000966944,
        "sampletime": 0.8925025550124701,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 345,
        "timesteps": 69000,
        "reward_mean": -0.58605,
        "reward_max": 0.36230000000000007,
        "reward_min": -1.8692874999999998,
        "leartime_s": 0.08481419601594098,
        "sampletime": 0.9173446559871081,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 346,
        "timesteps": 69200,
        "reward_mean": -0.40389999999999987,
        "reward_max": 0.6095187500000001,
        "reward_min": -1.4827625000000002,
        "leartime_s": 0.018428860988933593,
        "sampletime": 0.751911834027851,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 347,
        "timesteps": 69400,
        "reward_mean": -0.7368499999999999,
        "reward_max": 0.2633250000000001,
        "reward_min": -1.9363687499999995,
        "leartime_s": 0.03494907700223848,
        "sampletime": 0.8114270440128166,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 348,
        "timesteps": 69600,
        "reward_mean": -0.7648499999999999,
        "reward_max": 0.15843750000000006,
        "reward_min": -2.207325,
        "leartime_s": 0.04495838601724245,
        "sampletime": 0.9857220469857566,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 349,
        "timesteps": 69800,
        "reward_mean": -0.5723249999999999,
        "reward_max": 0.51264375,
        "reward_min": -1.801593749999999,
        "leartime_s": 0.07517039100639522,
        "sampletime": 0.8695020530140027,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 350,
        "timesteps": 70000,
        "reward_mean": -0.6558249999999999,
        "reward_max": 0.33236875000000005,
        "reward_min": -2.12633125,
        "leartime_s": 0.06131116798496805,
        "sampletime": 0.8118601659953129,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 351,
        "timesteps": 70200,
        "reward_mean": -0.71775,
        "reward_max": 0.49475,
        "reward_min": -2.13246875,
        "leartime_s": 0.04852904498693533,
        "sampletime": 1.0505172229895834,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 352,
        "timesteps": 70400,
        "reward_mean": -0.7125499999999999,
        "reward_max": 0.1482562500000001,
        "reward_min": -2.30073125,
        "leartime_s": 0.07506438900600187,
        "sampletime": 1.1257778569997754,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 353,
        "timesteps": 70600,
        "reward_mean": -0.6049249999999999,
        "reward_max": 0.2665000000000001,
        "reward_min": -1.9104250000000003,
        "leartime_s": 0.07746837200829759,
        "sampletime": 0.7573244709928986,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 354,
        "timesteps": 70800,
        "reward_mean": -0.7553749999999999,
        "reward_max": 0.32120624999999997,
        "reward_min": -1.99825625,
        "leartime_s": 0.04489405601634644,
        "sampletime": 0.8162220469966996,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 355,
        "timesteps": 71000,
        "reward_mean": -0.676625,
        "reward_max": 0.5926312499999999,
        "reward_min": -1.9338625,
        "leartime_s": 0.07772975499392487,
        "sampletime": 0.8460232010111213,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 356,
        "timesteps": 71200,
        "reward_mean": -0.6239250000000001,
        "reward_max": 0.38334999999999997,
        "reward_min": -1.7402374999999999,
        "leartime_s": 0.09638081598677672,
        "sampletime": 0.8733278760046232,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 357,
        "timesteps": 71400,
        "reward_mean": -0.4771999999999999,
        "reward_max": 0.3860125000000001,
        "reward_min": -1.5662375,
        "leartime_s": 0.07467671899939887,
        "sampletime": 0.8471940309973434,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 358,
        "timesteps": 71600,
        "reward_mean": -0.7297250000000002,
        "reward_max": 0.38278749999999995,
        "reward_min": -2.0569625000000005,
        "leartime_s": 0.07189924499834888,
        "sampletime": 0.7978362859867048,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 359,
        "timesteps": 71800,
        "reward_mean": -0.73335,
        "reward_max": 0.17629375000000003,
        "reward_min": -1.9852499999999997,
        "leartime_s": 0.0852425140037667,
        "sampletime": 1.039075831999071,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 360,
        "timesteps": 72000,
        "reward_mean": -0.24582499999999974,
        "reward_max": 0.7377062500000005,
        "reward_min": -1.7736749999999992,
        "leartime_s": 0.07558809398324229,
        "sampletime": 0.9173304160067346,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 361,
        "timesteps": 72200,
        "reward_mean": -0.6873999999999999,
        "reward_max": 0.5079125,
        "reward_min": -2.3104125,
        "leartime_s": 0.047692524996818975,
        "sampletime": 0.7720955910044722,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 362,
        "timesteps": 72400,
        "reward_mean": -0.48867499999999986,
        "reward_max": 0.7697749999999999,
        "reward_min": -1.40224375,
        "leartime_s": 0.03904840798350051,
        "sampletime": 0.8524946059915237,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 363,
        "timesteps": 72600,
        "reward_mean": -0.6737999999999998,
        "reward_max": 0.33870000000000006,
        "reward_min": -1.85088125,
        "leartime_s": 0.06636668700957671,
        "sampletime": 1.0004941369988956,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 364,
        "timesteps": 72800,
        "reward_mean": -0.41064999999999985,
        "reward_max": 0.6338625000000001,
        "reward_min": -1.3920875,
        "leartime_s": 0.07895556098083034,
        "sampletime": 0.7999446250032634,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 365,
        "timesteps": 73000,
        "reward_mean": -0.6575249999999998,
        "reward_max": 0.3595437500000003,
        "reward_min": -1.8306062500000002,
        "leartime_s": 0.03208834401448257,
        "sampletime": 0.8162744650035165,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 366,
        "timesteps": 73200,
        "reward_mean": -0.4539749999999999,
        "reward_max": 0.6818687500000002,
        "reward_min": -1.74591875,
        "leartime_s": 0.08436746199731715,
        "sampletime": 0.9244083020021208,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 367,
        "timesteps": 73400,
        "reward_mean": -0.7349249999999998,
        "reward_max": 0.19141875000000014,
        "reward_min": -1.7554249999999993,
        "leartime_s": 0.06363749201409519,
        "sampletime": 0.7512922339956276,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 368,
        "timesteps": 73600,
        "reward_mean": -0.15742499999999973,
        "reward_max": 0.6977625,
        "reward_min": -1.4439062499999995,
        "leartime_s": 0.0488357059948612,
        "sampletime": 0.8236907859973144,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 369,
        "timesteps": 73800,
        "reward_mean": -0.6820249999999998,
        "reward_max": 0.20903750000000015,
        "reward_min": -1.9694937499999994,
        "leartime_s": 0.026290834008250386,
        "sampletime": 1.0700157530081924,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 370,
        "timesteps": 74000,
        "reward_mean": -0.48017499999999985,
        "reward_max": 0.4113125000000001,
        "reward_min": -1.5201500000000001,
        "leartime_s": 0.06366233300650492,
        "sampletime": 0.8969050620216876,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 371,
        "timesteps": 74200,
        "reward_mean": -0.6818,
        "reward_max": 0.2609687500000001,
        "reward_min": -1.7778624999999997,
        "leartime_s": 0.05493666199618019,
        "sampletime": 0.8036465169861913,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 372,
        "timesteps": 74400,
        "reward_mean": -0.5545999999999996,
        "reward_max": 0.6307000000000004,
        "reward_min": -1.6905812499999993,
        "leartime_s": 0.037597532995278016,
        "sampletime": 0.9387508310028352,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 373,
        "timesteps": 74600,
        "reward_mean": -0.5438249999999998,
        "reward_max": 0.42428750000000015,
        "reward_min": -1.8793312500000001,
        "leartime_s": 0.05110619298648089,
        "sampletime": 0.8547642439953052,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 374,
        "timesteps": 74800,
        "reward_mean": -0.6346999999999997,
        "reward_max": 0.3433812500000002,
        "reward_min": -1.8058062499999992,
        "leartime_s": 0.04965108499163762,
        "sampletime": 0.7651396479923278,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 375,
        "timesteps": 75000,
        "reward_mean": -0.705575,
        "reward_max": 0.3552625000000001,
        "reward_min": -1.7390625,
        "leartime_s": 0.050759671023115516,
        "sampletime": 0.8032521239947528,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 376,
        "timesteps": 75200,
        "reward_mean": -0.774375,
        "reward_max": 0.25738125,
        "reward_min": -1.9647437499999998,
        "leartime_s": 0.02949106099549681,
        "sampletime": 0.7684535990119912,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 377,
        "timesteps": 75400,
        "reward_mean": -0.5381499999999999,
        "reward_max": 0.46300000000000024,
        "reward_min": -1.855074999999999,
        "leartime_s": 0.03042082700994797,
        "sampletime": 0.8045645989768673,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 378,
        "timesteps": 75600,
        "reward_mean": -0.5252249999999997,
        "reward_max": 0.5574500000000002,
        "reward_min": -1.4894437499999995,
        "leartime_s": 0.028758538013789803,
        "sampletime": 0.9412794219970237,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 379,
        "timesteps": 75800,
        "reward_mean": -0.6350749999999998,
        "reward_max": 0.4784000000000002,
        "reward_min": -1.9632500000000002,
        "leartime_s": 0.03144344099564478,
        "sampletime": 0.8112559939909261,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 380,
        "timesteps": 76000,
        "reward_mean": -0.5100249999999997,
        "reward_max": 0.5369750000000003,
        "reward_min": -1.8108999999999997,
        "leartime_s": 0.03403292500297539,
        "sampletime": 0.773210237006424,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 381,
        "timesteps": 76200,
        "reward_mean": -0.26977499999999976,
        "reward_max": 0.83224375,
        "reward_min": -1.6128624999999992,
        "leartime_s": 0.03690477999043651,
        "sampletime": 1.0178976239985786,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 382,
        "timesteps": 76400,
        "reward_mean": -0.5549999999999996,
        "reward_max": 0.4669187500000003,
        "reward_min": -1.7991124999999994,
        "leartime_s": 0.05744036499527283,
        "sampletime": 0.9068060729769059,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 383,
        "timesteps": 76600,
        "reward_mean": -0.5928499999999998,
        "reward_max": 0.3136625000000002,
        "reward_min": -1.8779375000000003,
        "leartime_s": 0.06996121001429856,
        "sampletime": 0.7831270220049191,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 384,
        "timesteps": 76800,
        "reward_mean": -0.44624999999999987,
        "reward_max": 0.4778687499999999,
        "reward_min": -1.8241312499999995,
        "leartime_s": 0.07684803500887938,
        "sampletime": 0.9236290490080137,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 385,
        "timesteps": 77000,
        "reward_mean": -0.3257749999999998,
        "reward_max": 0.5637625000000003,
        "reward_min": -1.507775,
        "leartime_s": 0.03755875301430933,
        "sampletime": 0.7475867210014258,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 386,
        "timesteps": 77200,
        "reward_mean": -0.35612499999999964,
        "reward_max": 0.6245750000000001,
        "reward_min": -1.6921687499999993,
        "leartime_s": 0.025968976988224313,
        "sampletime": 0.9039049569983035,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 387,
        "timesteps": 77400,
        "reward_mean": -0.3053249999999998,
        "reward_max": 0.6879125000000001,
        "reward_min": -1.9405124999999996,
        "leartime_s": 0.04892140600713901,
        "sampletime": 0.9032116580056027,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 388,
        "timesteps": 77600,
        "reward_mean": -0.3180249999999999,
        "reward_max": 0.5459500000000002,
        "reward_min": -1.665025,
        "leartime_s": 0.08237451300374232,
        "sampletime": 1.0208263520034961,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 389,
        "timesteps": 77800,
        "reward_mean": -0.6944249999999998,
        "reward_max": 0.33100625000000006,
        "reward_min": -2.09920625,
        "leartime_s": 0.06867822300409898,
        "sampletime": 0.7595489239902236,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 390,
        "timesteps": 78000,
        "reward_mean": -0.6527749999999998,
        "reward_max": 0.38139375000000003,
        "reward_min": -1.7422062499999997,
        "leartime_s": 0.04630965899559669,
        "sampletime": 0.8103060490102507,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 391,
        "timesteps": 78200,
        "reward_mean": -0.6607749999999999,
        "reward_max": 0.25796250000000026,
        "reward_min": -1.6511874999999998,
        "leartime_s": 0.04612331700627692,
        "sampletime": 0.9908527560182847,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 392,
        "timesteps": 78400,
        "reward_mean": -0.28417499999999973,
        "reward_max": 0.7465125000000001,
        "reward_min": -1.6154999999999997,
        "leartime_s": 0.04750503398827277,
        "sampletime": 0.7910019350238144,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 393,
        "timesteps": 78600,
        "reward_mean": -0.40645,
        "reward_max": 0.6188937499999999,
        "reward_min": -1.5041,
        "leartime_s": 0.07771962901460938,
        "sampletime": 0.7741739790071733,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 394,
        "timesteps": 78800,
        "reward_mean": -0.7643249999999998,
        "reward_max": 0.22168125000000016,
        "reward_min": -2.0974375000000003,
        "leartime_s": 0.08578697498887777,
        "sampletime": 1.0201158249983564,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 395,
        "timesteps": 79000,
        "reward_mean": -0.5057249999999999,
        "reward_max": 0.7118062500000002,
        "reward_min": -1.8539375000000002,
        "leartime_s": 0.05638285999884829,
        "sampletime": 0.8441601769882254,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 396,
        "timesteps": 79200,
        "reward_mean": -0.4218249999999998,
        "reward_max": 0.4745312500000002,
        "reward_min": -1.7630812500000002,
        "leartime_s": 0.03727151299244724,
        "sampletime": 0.8539982599904761,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 397,
        "timesteps": 79400,
        "reward_mean": -0.2603749999999997,
        "reward_max": 0.6882062500000002,
        "reward_min": -1.3706874999999998,
        "leartime_s": 0.07825027700164355,
        "sampletime": 0.7097519820090383,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 398,
        "timesteps": 79600,
        "reward_mean": -0.4709,
        "reward_max": 0.2792125,
        "reward_min": -1.5388249999999997,
        "leartime_s": 0.07921035098843277,
        "sampletime": 0.9307221900089644,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 399,
        "timesteps": 79800,
        "reward_mean": -0.4333249999999997,
        "reward_max": 0.5984937500000003,
        "reward_min": -1.4584874999999997,
        "leartime_s": 0.0698374739731662,
        "sampletime": 0.831488919997355,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 400,
        "timesteps": 80000,
        "reward_mean": -0.24082499999999965,
        "reward_max": 0.6262000000000003,
        "reward_min": -1.3012687499999995,
        "leartime_s": 0.04698874201858416,
        "sampletime": 0.7673536910151597,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 401,
        "timesteps": 80200,
        "reward_mean": -0.5998249999999998,
        "reward_max": 0.72995625,
        "reward_min": -2.3979312499999996,
        "leartime_s": 0.09323545297957025,
        "sampletime": 1.1253863830061164,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 402,
        "timesteps": 80400,
        "reward_mean": -0.49822499999999986,
        "reward_max": 0.38407500000000017,
        "reward_min": -1.9167625000000001,
        "leartime_s": 0.03262960899155587,
        "sampletime": 0.8614033220219426,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 403,
        "timesteps": 80600,
        "reward_mean": -0.35457499999999986,
        "reward_max": 0.74748125,
        "reward_min": -1.6389749999999994,
        "leartime_s": 0.04810417100088671,
        "sampletime": 0.7679037790221628,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 404,
        "timesteps": 80800,
        "reward_mean": -0.7786499999999996,
        "reward_max": 0.4136125000000001,
        "reward_min": -1.9549124999999994,
        "leartime_s": 0.0664867160085123,
        "sampletime": 0.9222181939985603,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 405,
        "timesteps": 81000,
        "reward_mean": -0.2579999999999999,
        "reward_max": 0.6017375000000003,
        "reward_min": -1.6415875000000002,
        "leartime_s": 0.0953993090079166,
        "sampletime": 0.7443669680214953,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 406,
        "timesteps": 81200,
        "reward_mean": -0.4647999999999999,
        "reward_max": 0.31895624999999994,
        "reward_min": -1.6499000000000001,
        "leartime_s": 0.06275153701426461,
        "sampletime": 0.7675790750072338,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 407,
        "timesteps": 81400,
        "reward_mean": -0.20537499999999967,
        "reward_max": 0.9263750000000005,
        "reward_min": -1.5228687500000002,
        "leartime_s": 0.06732770998496562,
        "sampletime": 0.906372719007777,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 408,
        "timesteps": 81600,
        "reward_mean": -0.18694999999999987,
        "reward_max": 0.79256875,
        "reward_min": -1.3943937499999994,
        "leartime_s": 0.07652851098100655,
        "sampletime": 1.0624320869974326,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 409,
        "timesteps": 81800,
        "reward_mean": -0.3861499999999999,
        "reward_max": 0.6504500000000001,
        "reward_min": -1.473075,
        "leartime_s": 0.061109168018447235,
        "sampletime": 0.83479549002368,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 410,
        "timesteps": 82000,
        "reward_mean": -0.4566749999999997,
        "reward_max": 0.4180312500000002,
        "reward_min": -1.83844375,
        "leartime_s": 0.03984659898560494,
        "sampletime": 0.7761661879776511,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 411,
        "timesteps": 82200,
        "reward_mean": -0.4772499999999999,
        "reward_max": 0.28765000000000024,
        "reward_min": -1.45486875,
        "leartime_s": 0.07600857500801794,
        "sampletime": 0.8650759939919226,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 412,
        "timesteps": 82400,
        "reward_mean": -0.20719999999999972,
        "reward_max": 0.7239000000000004,
        "reward_min": -1.4634,
        "leartime_s": 0.07058083199081011,
        "sampletime": 0.7086674270103686,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 413,
        "timesteps": 82600,
        "reward_mean": -0.12912499999999982,
        "reward_max": 0.79379375,
        "reward_min": -1.1810437499999997,
        "leartime_s": 0.06427246500970796,
        "sampletime": 0.6502716859977227,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 414,
        "timesteps": 82800,
        "reward_mean": -0.48329999999999973,
        "reward_max": 0.4844500000000002,
        "reward_min": -1.8038999999999996,
        "leartime_s": 0.08601588898454793,
        "sampletime": 1.0094921459967736,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 415,
        "timesteps": 83000,
        "reward_mean": -0.4567499999999999,
        "reward_max": 0.47913124999999995,
        "reward_min": -1.8737562499999998,
        "leartime_s": 0.09150838101049885,
        "sampletime": 1.0727842839842197,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 416,
        "timesteps": 83200,
        "reward_mean": -0.20237499999999972,
        "reward_max": 0.8876437500000002,
        "reward_min": -1.1671812499999994,
        "leartime_s": 0.07846724800765514,
        "sampletime": 0.8174022479797713,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 417,
        "timesteps": 83400,
        "reward_mean": -0.2696499999999997,
        "reward_max": 0.5964250000000002,
        "reward_min": -1.4908999999999997,
        "leartime_s": 0.08035058199311607,
        "sampletime": 0.8419646979891695,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 418,
        "timesteps": 83600,
        "reward_mean": -0.13427499999999987,
        "reward_max": 0.7579437500000002,
        "reward_min": -1.6366437500000002,
        "leartime_s": 0.07890566499554552,
        "sampletime": 1.015965374012012,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 419,
        "timesteps": 83800,
        "reward_mean": -0.48012499999999975,
        "reward_max": 0.4074562500000001,
        "reward_min": -1.7124062499999997,
        "leartime_s": 0.03307045201654546,
        "sampletime": 0.7515537579893135,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 420,
        "timesteps": 84000,
        "reward_mean": -0.2823249999999998,
        "reward_max": 0.7605250000000001,
        "reward_min": -1.3308625000000003,
        "leartime_s": 0.07542816599016078,
        "sampletime": 0.8153970150160603,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 421,
        "timesteps": 84200,
        "reward_mean": -0.14897499999999964,
        "reward_max": 0.6658625000000004,
        "reward_min": -1.2400624999999998,
        "leartime_s": 0.05609015398658812,
        "sampletime": 0.9262486490188166,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 422,
        "timesteps": 84400,
        "reward_mean": -0.30709999999999976,
        "reward_max": 0.6400000000000003,
        "reward_min": -1.4871125000000003,
        "leartime_s": 0.07946801098296419,
        "sampletime": 1.0235838940134272,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 423,
        "timesteps": 84600,
        "reward_mean": -0.25597499999999973,
        "reward_max": 0.6018625000000003,
        "reward_min": -1.2135562500000001,
        "leartime_s": 0.06345616400358267,
        "sampletime": 0.7569955970102455,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 424,
        "timesteps": 84800,
        "reward_mean": -0.47717499999999985,
        "reward_max": 0.4355125000000003,
        "reward_min": -1.9216937499999998,
        "leartime_s": 0.06532582300133072,
        "sampletime": 0.7525322249857709,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 425,
        "timesteps": 85000,
        "reward_mean": -0.30539999999999967,
        "reward_max": 0.41496250000000023,
        "reward_min": -1.2151375,
        "leartime_s": 0.05607981199864298,
        "sampletime": 0.928801806003321,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 426,
        "timesteps": 85200,
        "reward_mean": -0.22497499999999968,
        "reward_max": 0.8670250000000004,
        "reward_min": -1.5006187499999997,
        "leartime_s": 0.056285747996298596,
        "sampletime": 0.8927788559813052,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 427,
        "timesteps": 85400,
        "reward_mean": -0.3592249999999997,
        "reward_max": 0.5984250000000001,
        "reward_min": -1.7106312499999996,
        "leartime_s": 0.05988439699285664,
        "sampletime": 0.7487495980167296,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 428,
        "timesteps": 85600,
        "reward_mean": -0.09872499999999973,
        "reward_max": 0.7934000000000002,
        "reward_min": -1.1840625,
        "leartime_s": 0.0635631250042934,
        "sampletime": 0.9774598589865491,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 429,
        "timesteps": 85800,
        "reward_mean": -0.3487249999999998,
        "reward_max": 0.4422812500000004,
        "reward_min": -1.6811624999999994,
        "leartime_s": 0.07742910701199435,
        "sampletime": 0.7452700779831503,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 430,
        "timesteps": 86000,
        "reward_mean": -0.36297499999999977,
        "reward_max": 0.6768750000000002,
        "reward_min": -1.7753999999999994,
        "leartime_s": 0.04277217501658015,
        "sampletime": 0.9009937520022504,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 431,
        "timesteps": 86200,
        "reward_mean": 0.0027000000000001554,
        "reward_max": 0.9048875000000001,
        "reward_min": -1.0684749999999994,
        "leartime_s": 0.07618078999803402,
        "sampletime": 0.8808186179958284,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 432,
        "timesteps": 86400,
        "reward_mean": -0.10189999999999977,
        "reward_max": 0.8270312500000004,
        "reward_min": -1.1733687500000003,
        "leartime_s": 0.09318816199083813,
        "sampletime": 0.9295603069767822,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 433,
        "timesteps": 86600,
        "reward_mean": -0.08347499999999988,
        "reward_max": 0.8635812500000001,
        "reward_min": -1.4543562500000002,
        "leartime_s": 0.061395924014505,
        "sampletime": 0.7585907629982103,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 434,
        "timesteps": 86800,
        "reward_mean": -0.2529249999999999,
        "reward_max": 0.6368250000000002,
        "reward_min": -1.67423125,
        "leartime_s": 0.03924335999181494,
        "sampletime": 0.841902268002741,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 435,
        "timesteps": 87000,
        "reward_mean": -0.23379999999999984,
        "reward_max": 0.6464000000000001,
        "reward_min": -1.3969687499999999,
        "leartime_s": 0.07479469300596975,
        "sampletime": 1.0879646039975341,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 436,
        "timesteps": 87200,
        "reward_mean": -0.30654999999999977,
        "reward_max": 0.6782687500000001,
        "reward_min": -1.8636749999999993,
        "leartime_s": 0.038749675994040444,
        "sampletime": 0.763547706999816,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 437,
        "timesteps": 87400,
        "reward_mean": -0.3252249999999998,
        "reward_max": 0.5974375000000005,
        "reward_min": -1.2807750000000002,
        "leartime_s": 0.041156258987030014,
        "sampletime": 0.8093495109933428,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 438,
        "timesteps": 87600,
        "reward_mean": -0.26919999999999983,
        "reward_max": 0.44531250000000017,
        "reward_min": -1.3687374999999997,
        "leartime_s": 0.08436568698380142,
        "sampletime": 1.0437537189864088,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 439,
        "timesteps": 87800,
        "reward_mean": -0.30754999999999977,
        "reward_max": 0.6214812500000002,
        "reward_min": -1.48279375,
        "leartime_s": 0.057099703000858426,
        "sampletime": 0.8513858290098142,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 440,
        "timesteps": 88000,
        "reward_mean": -0.4275749999999999,
        "reward_max": 0.43718124999999997,
        "reward_min": -1.8705124999999996,
        "leartime_s": 0.0677534080168698,
        "sampletime": 0.7106652049988043,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 441,
        "timesteps": 88200,
        "reward_mean": -0.45789999999999986,
        "reward_max": 0.6610187500000001,
        "reward_min": -1.8501874999999999,
        "leartime_s": 0.05998242099303752,
        "sampletime": 0.715495648997603,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 442,
        "timesteps": 88400,
        "reward_mean": -0.25924999999999987,
        "reward_max": 0.6908125000000002,
        "reward_min": -1.6204499999999993,
        "leartime_s": 0.07252672599861398,
        "sampletime": 0.9638353539921809,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 443,
        "timesteps": 88600,
        "reward_mean": -0.34309999999999974,
        "reward_max": 0.6785875000000002,
        "reward_min": -1.5638312499999996,
        "leartime_s": 0.06280675399466418,
        "sampletime": 0.8496480899921153,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 444,
        "timesteps": 88800,
        "reward_mean": -0.047824999999999805,
        "reward_max": 0.8728000000000001,
        "reward_min": -1.3108562499999998,
        "leartime_s": 0.06593625000095926,
        "sampletime": 0.8244211780256592,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 445,
        "timesteps": 89000,
        "reward_mean": -0.017549999999999663,
        "reward_max": 0.9502687500000004,
        "reward_min": -0.9995624999999996,
        "leartime_s": 0.03942597901914269,
        "sampletime": 1.0607680579996668,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 446,
        "timesteps": 89200,
        "reward_mean": -0.4794999999999998,
        "reward_max": 0.45728750000000007,
        "reward_min": -1.8426062499999993,
        "leartime_s": 0.07354507100535557,
        "sampletime": 0.7411637800105382,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 447,
        "timesteps": 89400,
        "reward_mean": -0.2321499999999998,
        "reward_max": 0.7132187500000002,
        "reward_min": -1.48710625,
        "leartime_s": 0.030301969993161038,
        "sampletime": 0.7155802630004473,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 448,
        "timesteps": 89600,
        "reward_mean": -0.16162499999999974,
        "reward_max": 0.9478687500000003,
        "reward_min": -1.2738999999999994,
        "leartime_s": 0.03563993200077675,
        "sampletime": 0.7147869990149047,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 449,
        "timesteps": 89800,
        "reward_mean": -0.27039999999999986,
        "reward_max": 0.5693312500000002,
        "reward_min": -1.7324749999999998,
        "leartime_s": 0.024189880001358688,
        "sampletime": 0.7361673470004462,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 450,
        "timesteps": 90000,
        "reward_mean": -0.44447499999999984,
        "reward_max": 0.4689500000000003,
        "reward_min": -1.6024812499999999,
        "leartime_s": 0.08584839801187627,
        "sampletime": 0.7660200859827455,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 451,
        "timesteps": 90200,
        "reward_mean": -0.0816749999999999,
        "reward_max": 0.75395,
        "reward_min": -1.6878062500000002,
        "leartime_s": 0.05007689102785662,
        "sampletime": 0.9750138729868922,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 452,
        "timesteps": 90400,
        "reward_mean": -0.07764999999999973,
        "reward_max": 0.6908125000000003,
        "reward_min": -1.2393312500000002,
        "leartime_s": 0.10410350700840354,
        "sampletime": 0.955400623002788,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 453,
        "timesteps": 90600,
        "reward_mean": -0.1605749999999999,
        "reward_max": 0.8117437500000002,
        "reward_min": -1.0631249999999997,
        "leartime_s": 0.08179817599011585,
        "sampletime": 0.7601170640264172,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 454,
        "timesteps": 90800,
        "reward_mean": -0.27027499999999965,
        "reward_max": 0.5237250000000004,
        "reward_min": -1.3554874999999997,
        "leartime_s": 0.07628684700466692,
        "sampletime": 0.8947628760070074,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 455,
        "timesteps": 91000,
        "reward_mean": -0.23667499999999983,
        "reward_max": 0.4920875000000004,
        "reward_min": -1.5686937499999998,
        "leartime_s": 0.07858670799760148,
        "sampletime": 1.1029185609950218,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 456,
        "timesteps": 91200,
        "reward_mean": -0.3845999999999998,
        "reward_max": 0.5217875000000001,
        "reward_min": -1.7026124999999996,
        "leartime_s": 0.0659996040049009,
        "sampletime": 0.7885080910054967,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 457,
        "timesteps": 91400,
        "reward_mean": -0.11017499999999981,
        "reward_max": 0.7541312500000001,
        "reward_min": -1.0741249999999993,
        "leartime_s": 0.06050336401676759,
        "sampletime": 0.914100714988308,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 458,
        "timesteps": 91600,
        "reward_mean": -0.1498249999999997,
        "reward_max": 0.7128750000000004,
        "reward_min": -1.5574374999999996,
        "leartime_s": 0.062234772980445996,
        "sampletime": 0.9802694230165798,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 459,
        "timesteps": 91800,
        "reward_mean": -0.26704999999999984,
        "reward_max": 0.6524375,
        "reward_min": -1.551025,
        "leartime_s": 0.05602336101583205,
        "sampletime": 0.851721366023412,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 460,
        "timesteps": 92000,
        "reward_mean": -0.06269999999999964,
        "reward_max": 0.7650187500000005,
        "reward_min": -1.4854812499999994,
        "leartime_s": 0.058809254987863824,
        "sampletime": 0.8012173380120657,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 461,
        "timesteps": 92200,
        "reward_mean": -0.00514999999999959,
        "reward_max": 0.7613750000000005,
        "reward_min": -1.0092749999999997,
        "leartime_s": 0.07307720300741494,
        "sampletime": 0.8833766409952659,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 462,
        "timesteps": 92400,
        "reward_mean": -0.2060249999999999,
        "reward_max": 0.745525,
        "reward_min": -1.4779437500000001,
        "leartime_s": 0.07473937200848013,
        "sampletime": 0.8567703590088058,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 463,
        "timesteps": 92600,
        "reward_mean": -0.2966999999999998,
        "reward_max": 0.4368875000000001,
        "reward_min": -1.5309812499999995,
        "leartime_s": 0.07276636298047379,
        "sampletime": 0.8111284729966428,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 464,
        "timesteps": 92800,
        "reward_mean": -0.34222499999999983,
        "reward_max": 0.5803312500000002,
        "reward_min": -1.8515499999999998,
        "leartime_s": 0.04738227598136291,
        "sampletime": 0.9063630210002884,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 465,
        "timesteps": 93000,
        "reward_mean": -0.16157499999999983,
        "reward_max": 0.8840124999999998,
        "reward_min": -1.22858125,
        "leartime_s": 0.09288263000780717,
        "sampletime": 1.0400742320052814,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 466,
        "timesteps": 93200,
        "reward_mean": -0.3744249999999998,
        "reward_max": 0.4447312500000003,
        "reward_min": -1.3675812499999995,
        "leartime_s": 0.0803249440214131,
        "sampletime": 0.7725902060046792,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 467,
        "timesteps": 93400,
        "reward_mean": -0.3903249999999998,
        "reward_max": 0.4389187500000002,
        "reward_min": -1.3604562500000004,
        "leartime_s": 0.047361215023556724,
        "sampletime": 0.7653348890016787,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 468,
        "timesteps": 93600,
        "reward_mean": -0.11439999999999984,
        "reward_max": 0.8062125,
        "reward_min": -1.3652562499999998,
        "leartime_s": 0.07558021601289511,
        "sampletime": 0.8827778920240235,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 469,
        "timesteps": 93800,
        "reward_mean": -0.29882499999999973,
        "reward_max": 0.6459750000000002,
        "reward_min": -2.32801875,
        "leartime_s": 0.09918747597839683,
        "sampletime": 0.8781558710034005,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 470,
        "timesteps": 94000,
        "reward_mean": -0.2574749999999998,
        "reward_max": 0.7842875000000001,
        "reward_min": -1.5852124999999995,
        "leartime_s": 0.06954783498076722,
        "sampletime": 0.8161457889946178,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 471,
        "timesteps": 94200,
        "reward_mean": -0.14369999999999983,
        "reward_max": 0.7436625000000002,
        "reward_min": -1.69135,
        "leartime_s": 0.08407742201234214,
        "sampletime": 1.0407398460083641,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 472,
        "timesteps": 94400,
        "reward_mean": -0.46612499999999985,
        "reward_max": 0.5489937500000002,
        "reward_min": -1.9632624999999995,
        "leartime_s": 0.04748624298372306,
        "sampletime": 0.8757114949985407,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 473,
        "timesteps": 94600,
        "reward_mean": -0.32482499999999986,
        "reward_max": 0.4994500000000001,
        "reward_min": -1.8845999999999998,
        "leartime_s": 0.07512856597895734,
        "sampletime": 0.6734589480038267,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 474,
        "timesteps": 94800,
        "reward_mean": -0.32557499999999984,
        "reward_max": 0.6283500000000003,
        "reward_min": -1.56923125,
        "leartime_s": 0.07785356798558496,
        "sampletime": 0.9628046689904295,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 475,
        "timesteps": 95000,
        "reward_mean": -0.14594999999999983,
        "reward_max": 0.7632500000000001,
        "reward_min": -1.4975374999999995,
        "leartime_s": 0.07612516198423691,
        "sampletime": 1.0608841229986865,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 476,
        "timesteps": 95200,
        "reward_mean": -0.1363,
        "reward_max": 0.8837249999999999,
        "reward_min": -1.3004125000000006,
        "leartime_s": 0.06262420999701135,
        "sampletime": 0.8467077749955934,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 477,
        "timesteps": 95400,
        "reward_mean": -0.11209999999999985,
        "reward_max": 0.7641937500000004,
        "reward_min": -1.1105687499999997,
        "leartime_s": 0.07746644999133423,
        "sampletime": 0.7834416970144957,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 478,
        "timesteps": 95600,
        "reward_mean": -0.4400999999999998,
        "reward_max": 0.36743125,
        "reward_min": -1.6759874999999997,
        "leartime_s": 0.06519216400920413,
        "sampletime": 0.8648426299914718,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 479,
        "timesteps": 95800,
        "reward_mean": -0.22572499999999984,
        "reward_max": 0.6691125,
        "reward_min": -1.5090874999999997,
        "leartime_s": 0.08600881398888305,
        "sampletime": 0.8754074299940839,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 480,
        "timesteps": 96000,
        "reward_mean": -0.15137499999999987,
        "reward_max": 0.7612562500000001,
        "reward_min": -1.2298687499999996,
        "leartime_s": 0.05393046300741844,
        "sampletime": 0.7494322670099791,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 481,
        "timesteps": 96200,
        "reward_mean": -0.23564999999999983,
        "reward_max": 0.6571500000000001,
        "reward_min": -1.3289000000000002,
        "leartime_s": 0.07887926700641401,
        "sampletime": 0.8356822899950203,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 482,
        "timesteps": 96400,
        "reward_mean": -0.4549999999999999,
        "reward_max": 0.51855,
        "reward_min": -1.6688749999999994,
        "leartime_s": 0.07982112202444114,
        "sampletime": 0.9428815099818166,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 483,
        "timesteps": 96600,
        "reward_mean": -0.40269999999999995,
        "reward_max": 0.6083812499999999,
        "reward_min": -2.0116875,
        "leartime_s": 0.05542724300175905,
        "sampletime": 0.7293619069969282,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 484,
        "timesteps": 96800,
        "reward_mean": -0.19279999999999978,
        "reward_max": 0.6984500000000001,
        "reward_min": -1.7895499999999995,
        "leartime_s": 0.07927267902414314,
        "sampletime": 0.7028537949954625,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 485,
        "timesteps": 97000,
        "reward_mean": -0.33304999999999974,
        "reward_max": 0.5330000000000003,
        "reward_min": -1.5244812499999996,
        "leartime_s": 0.07623249202151783,
        "sampletime": 0.897352169995429,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 486,
        "timesteps": 97200,
        "reward_mean": -0.5047499999999998,
        "reward_max": 0.2758875000000002,
        "reward_min": -1.9027374999999995,
        "leartime_s": 0.04376404901267961,
        "sampletime": 0.8522614569810685,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 487,
        "timesteps": 97400,
        "reward_mean": -0.376475,
        "reward_max": 0.37107499999999977,
        "reward_min": -1.4140875,
        "leartime_s": 0.06663571301032789,
        "sampletime": 0.9720641119929496,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 488,
        "timesteps": 97600,
        "reward_mean": -0.5449999999999998,
        "reward_max": 0.3998875000000001,
        "reward_min": -1.8441124999999996,
        "leartime_s": 0.08122176001779735,
        "sampletime": 0.7994914770242758,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 489,
        "timesteps": 97800,
        "reward_mean": -0.40502499999999997,
        "reward_max": 0.47909375000000015,
        "reward_min": -1.8231249999999994,
        "leartime_s": 0.054355756990844384,
        "sampletime": 0.8339702539960854,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 490,
        "timesteps": 98000,
        "reward_mean": -0.3636999999999998,
        "reward_max": 0.5359500000000001,
        "reward_min": -1.5396312500000005,
        "leartime_s": 0.06647155198152177,
        "sampletime": 0.8576020860054996,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 491,
        "timesteps": 98200,
        "reward_mean": -0.36004999999999965,
        "reward_max": 0.5703000000000004,
        "reward_min": -1.4296999999999995,
        "leartime_s": 0.05959814300877042,
        "sampletime": 0.8910008519887924,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 492,
        "timesteps": 98400,
        "reward_mean": -0.3926999999999998,
        "reward_max": 0.7049875000000002,
        "reward_min": -1.4822624999999998,
        "leartime_s": 0.08950925598037429,
        "sampletime": 0.7598573380091693,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 493,
        "timesteps": 98600,
        "reward_mean": -0.40884999999999977,
        "reward_max": 0.5648000000000003,
        "reward_min": -2.1209499999999992,
        "leartime_s": 0.07746225301525556,
        "sampletime": 1.0462102589954156,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 494,
        "timesteps": 98800,
        "reward_mean": -0.5072499999999998,
        "reward_max": 0.4291312500000002,
        "reward_min": -1.8857312499999992,
        "leartime_s": 0.06296150400885381,
        "sampletime": 0.7268586120044347,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 495,
        "timesteps": 99000,
        "reward_mean": -0.3142249999999998,
        "reward_max": 0.6052437500000001,
        "reward_min": -1.45345625,
        "leartime_s": 0.04519782500574365,
        "sampletime": 0.7310829389898572,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 496,
        "timesteps": 99200,
        "reward_mean": -0.5372249999999998,
        "reward_max": 0.41281875000000023,
        "reward_min": -1.9120812499999995,
        "leartime_s": 0.03566545300418511,
        "sampletime": 0.8788643949956167,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 497,
        "timesteps": 99400,
        "reward_mean": -0.25492499999999985,
        "reward_max": 0.71853125,
        "reward_min": -1.4015687499999998,
        "leartime_s": 0.029476410010829568,
        "sampletime": 0.8722470499924384,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 498,
        "timesteps": 99600,
        "reward_mean": -0.3374499999999998,
        "reward_max": 0.8902750000000003,
        "reward_min": -1.6135312499999996,
        "leartime_s": 0.05348173397942446,
        "sampletime": 0.8298784679791424,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 499,
        "timesteps": 99800,
        "reward_mean": -0.4081249999999997,
        "reward_max": 0.6356312500000002,
        "reward_min": -1.7964874999999996,
        "leartime_s": 0.041704689007019624,
        "sampletime": 0.9710168020101264,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    },
    {
        "generation": 500,
        "timesteps": 100000,
        "reward_mean": -0.4756499999999998,
        "reward_max": 0.3957187500000001,
        "reward_min": -1.9165562499999997,
        "leartime_s": 0.03789365798002109,
        "sampletime": 0.719771434989525,
        "best_mean": 0.40622500000000006,
        "best_max": 1.2823249999999995,
        "params": {
            "agentsize": 1000,
            "yellow": 0,
            "seeds": 212,
            "it": 500,
            "envs": 4,
            "population": 250,
            "sampling": 16,
            "method": "oes"
        }
    }
]