[
  {
    "gen": 1,
    "reward_mean": -45.6842667088364,
    "reward_max": -42.22419270833331,
    "reward_min": -47.18926136363635,
    "reward_std": 1.009698151307871,
    "timesteps": 360720,
    "learntime": 1.1220512390136719,
    "sampletime": 21.32838537101634,
    "best_max_mean": -45.6842667088364,
    "best_max": -42.22419270833331
  },
  {
    "gen": 2,
    "reward_mean": -45.66339738325638,
    "reward_max": -43.321979166666665,
    "reward_min": -47.160113636363604,
    "reward_std": 0.9888759708229943,
    "timesteps": 721440,
    "learntime": 0.5375441440846771,
    "sampletime": 20.99331415304914,
    "best_max_mean": -45.6842667088364,
    "best_max": -42.22419270833331
  },
  {
    "gen": 3,
    "reward_mean": -45.294811086943646,
    "reward_max": -42.69238636363638,
    "reward_min": -46.88596590909089,
    "reward_std": 0.9527020203846929,
    "timesteps": 1082160,
    "learntime": 0.1658126888796687,
    "sampletime": 21.414646149147302,
    "best_max_mean": -45.6842667088364,
    "best_max": -42.22419270833331
  },
  {
    "gen": 4,
    "reward_mean": -44.52848655007102,
    "reward_max": -40.54478693181817,
    "reward_min": -46.948607954545466,
    "reward_std": 1.4028616854100195,
    "timesteps": 1442880,
    "learntime": 0.17411657003685832,
    "sampletime": 21.092765622073784,
    "best_max_mean": -44.52848655007102,
    "best_max": -40.54478693181817
  },
  {
    "gen": 5,
    "reward_mean": -44.655524328983184,
    "reward_max": -41.09082386363636,
    "reward_min": -46.43217329545455,
    "reward_std": 1.1640840685057063,
    "timesteps": 1803600,
    "learntime": 0.19191756891086698,
    "sampletime": 21.16677652997896,
    "best_max_mean": -44.52848655007102,
    "best_max": -40.54478693181817
  },
  {
    "gen": 6,
    "reward_mean": -45.292744806463055,
    "reward_max": -41.98177556818182,
    "reward_min": -47.04391927083331,
    "reward_std": 1.0917994315010602,
    "timesteps": 2164320,
    "learntime": 0.255708415992558,
    "sampletime": 21.467236537951976,
    "best_max_mean": -44.52848655007102,
    "best_max": -40.54478693181817
  },
  {
    "gen": 7,
    "reward_mean": -44.23686199766216,
    "reward_max": -38.95954545454546,
    "reward_min": -46.676065340909076,
    "reward_std": 1.5464598558156477,
    "timesteps": 2525040,
    "learntime": 0.29443408199585974,
    "sampletime": 21.163144340040162,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 8,
    "reward_mean": -45.444644072561545,
    "reward_max": -41.94380681818182,
    "reward_min": -47.019545454545465,
    "reward_std": 1.1002829037186288,
    "timesteps": 2885760,
    "learntime": 0.20625929906964302,
    "sampletime": 21.19685628497973,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 9,
    "reward_mean": -43.97668986002603,
    "reward_max": -39.900369318181816,
    "reward_min": -46.785482954545415,
    "reward_std": 1.5488023310701506,
    "timesteps": 3246480,
    "learntime": 0.30049811000935733,
    "sampletime": 20.838871947024018,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 10,
    "reward_mean": -44.23601281368371,
    "reward_max": -40.406523437500006,
    "reward_min": -46.62055397727273,
    "reward_std": 1.4869130979568481,
    "timesteps": 3607200,
    "learntime": 0.20112726115621626,
    "sampletime": 21.170543473912403,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 11,
    "reward_mean": -45.28575929583925,
    "reward_max": -42.09348011363639,
    "reward_min": -47.26894531249999,
    "reward_std": 1.1005827324890303,
    "timesteps": 3967920,
    "learntime": 0.20061004720628262,
    "sampletime": 21.228267691796646,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 12,
    "reward_mean": -43.737262499260176,
    "reward_max": -39.2762784090909,
    "reward_min": -46.522627840909095,
    "reward_std": 1.4994318062072427,
    "timesteps": 4328640,
    "learntime": 0.18296887702308595,
    "sampletime": 20.670637317933142,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 13,
    "reward_mean": -44.63819369229403,
    "reward_max": -40.70294034090908,
    "reward_min": -46.853997395833325,
    "reward_std": 1.1950216694445859,
    "timesteps": 4689360,
    "learntime": 0.18470868305303156,
    "sampletime": 21.116054587997496,
    "best_max_mean": -44.23686199766216,
    "best_max": -38.95954545454546
  },
  {
    "gen": 14,
    "reward_mean": -43.38234027284564,
    "reward_max": -38.073849431818175,
    "reward_min": -46.634914772727264,
    "reward_std": 1.8309472362825667,
    "timesteps": 5050080,
    "learntime": 0.18841878208331764,
    "sampletime": 20.83127658907324,
    "best_max_mean": -43.38234027284564,
    "best_max": -38.073849431818175
  },
  {
    "gen": 15,
    "reward_mean": -44.022618519176135,
    "reward_max": -38.930468749999996,
    "reward_min": -46.94330965909087,
    "reward_std": 1.7330744418452306,
    "timesteps": 5410800,
    "learntime": 0.1858511168975383,
    "sampletime": 20.893898020964116,
    "best_max_mean": -43.38234027284564,
    "best_max": -38.073849431818175
  },
  {
    "gen": 16,
    "reward_mean": -45.00853243741121,
    "reward_max": -42.378252840909106,
    "reward_min": -46.90031249999998,
    "reward_std": 1.1885219337809039,
    "timesteps": 5771520,
    "learntime": 0.3047615170944482,
    "sampletime": 21.052003222052008,
    "best_max_mean": -43.38234027284564,
    "best_max": -38.073849431818175
  },
  {
    "gen": 17,
    "reward_mean": -42.140252888997395,
    "reward_max": -37.118606770833345,
    "reward_min": -46.33389204545455,
    "reward_std": 2.0547926313485956,
    "timesteps": 6132240,
    "learntime": 0.2679807129316032,
    "sampletime": 20.806827127933502,
    "best_max_mean": -42.140252888997395,
    "best_max": -37.118606770833345
  },
  {
    "gen": 18,
    "reward_mean": -42.70607717803031,
    "reward_max": -37.07639204545457,
    "reward_min": -46.29251420454547,
    "reward_std": 2.110058995703171,
    "timesteps": 6492960,
    "learntime": 0.275072606978938,
    "sampletime": 20.747668860014528,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 19,
    "reward_mean": -42.804760483250476,
    "reward_max": -37.24470170454545,
    "reward_min": -46.51622159090911,
    "reward_std": 1.9820257953340938,
    "timesteps": 6853680,
    "learntime": 0.26859856909140944,
    "sampletime": 20.872198384953663,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 20,
    "reward_mean": -43.36591162479285,
    "reward_max": -39.0851846590909,
    "reward_min": -45.8729119318182,
    "reward_std": 1.4913873032916782,
    "timesteps": 7214400,
    "learntime": 0.2975136791355908,
    "sampletime": 20.768903992837295,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 21,
    "reward_mean": -43.28071609034684,
    "reward_max": -37.86078125000001,
    "reward_min": -45.99855113636363,
    "reward_std": 1.7861573531152164,
    "timesteps": 7575120,
    "learntime": 0.2695986849721521,
    "sampletime": 20.640545454109088,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 22,
    "reward_mean": -44.35966057054926,
    "reward_max": -39.256406250000005,
    "reward_min": -47.366036931818236,
    "reward_std": 1.7643765503370716,
    "timesteps": 7935840,
    "learntime": 0.29328645090572536,
    "sampletime": 20.618863214040175,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 23,
    "reward_mean": -43.37248721960821,
    "reward_max": -38.50805989583335,
    "reward_min": -46.416505681818194,
    "reward_std": 1.4970629115145446,
    "timesteps": 8296560,
    "learntime": 0.27402617991901934,
    "sampletime": 20.63779238704592,
    "best_max_mean": -42.70607717803031,
    "best_max": -37.07639204545457
  },
  {
    "gen": 24,
    "reward_mean": -41.56898074988163,
    "reward_max": -34.468607954545476,
    "reward_min": -46.20093750000002,
    "reward_std": 2.0261633182748264,
    "timesteps": 8657280,
    "learntime": 0.2663868328090757,
    "sampletime": 20.646767833037302,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 25,
    "reward_mean": -43.711368907581694,
    "reward_max": -39.72653409090915,
    "reward_min": -46.1502130681819,
    "reward_std": 1.4693696677755153,
    "timesteps": 9018000,
    "learntime": 0.2639304460026324,
    "sampletime": 20.793869332876056,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 26,
    "reward_mean": -41.17515532522492,
    "reward_max": -36.71139322916671,
    "reward_min": -45.041704545454564,
    "reward_std": 1.9586992309256501,
    "timesteps": 9378720,
    "learntime": 0.27973730489611626,
    "sampletime": 20.755917644128203,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 27,
    "reward_mean": -40.32309154163708,
    "reward_max": -36.04024147727276,
    "reward_min": -45.19563920454546,
    "reward_std": 2.038750446663727,
    "timesteps": 9739440,
    "learntime": 0.2631279961206019,
    "sampletime": 20.43220985098742,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 28,
    "reward_mean": -42.30533643317946,
    "reward_max": -37.64267045454546,
    "reward_min": -45.49389322916667,
    "reward_std": 1.5966200274826765,
    "timesteps": 10100160,
    "learntime": 0.31211839406751096,
    "sampletime": 20.68751030997373,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 29,
    "reward_mean": -42.81897392504144,
    "reward_max": -39.34511363636364,
    "reward_min": -45.51906250000005,
    "reward_std": 1.3683538927561587,
    "timesteps": 10460880,
    "learntime": 0.27544696000404656,
    "sampletime": 20.699544006958604,
    "best_max_mean": -41.56898074988163,
    "best_max": -34.468607954545476
  },
  {
    "gen": 30,
    "reward_mean": -40.405350193832874,
    "reward_max": -33.7596022727273,
    "reward_min": -45.268125000000026,
    "reward_std": 2.388801780560081,
    "timesteps": 10821600,
    "learntime": 0.28909359918907285,
    "sampletime": 20.52007736102678,
    "best_max_mean": -40.405350193832874,
    "best_max": -33.7596022727273
  },
  {
    "gen": 31,
    "reward_mean": -40.40172254157791,
    "reward_max": -33.378565340909155,
    "reward_min": -44.91886363636364,
    "reward_std": 2.802166417404671,
    "timesteps": 11182320,
    "learntime": 0.27887349389493465,
    "sampletime": 20.23524600896053,
    "best_max_mean": -40.40172254157791,
    "best_max": -33.378565340909155
  },
  {
    "gen": 32,
    "reward_mean": -38.8949490079013,
    "reward_max": -33.690703125000034,
    "reward_min": -43.72458806818183,
    "reward_std": 2.035468789744942,
    "timesteps": 11543040,
    "learntime": 0.2921665289904922,
    "sampletime": 20.197128784144297,
    "best_max_mean": -40.40172254157791,
    "best_max": -33.378565340909155
  },
  {
    "gen": 33,
    "reward_mean": -41.18066866787998,
    "reward_max": -33.32254261363639,
    "reward_min": -44.82971590909091,
    "reward_std": 2.118251987278207,
    "timesteps": 11903760,
    "learntime": 0.2883072670083493,
    "sampletime": 20.62879035505466,
    "best_max_mean": -41.18066866787998,
    "best_max": -33.32254261363639
  },
  {
    "gen": 34,
    "reward_mean": -40.09867966160632,
    "reward_max": -34.70707386363639,
    "reward_min": -44.000653409090916,
    "reward_std": 2.1307425885631326,
    "timesteps": 12264480,
    "learntime": 0.3148332240525633,
    "sampletime": 20.379068786045536,
    "best_max_mean": -41.18066866787998,
    "best_max": -33.32254261363639
  },
  {
    "gen": 35,
    "reward_mean": -39.63690734863282,
    "reward_max": -35.94525568181821,
    "reward_min": -45.314289772727264,
    "reward_std": 2.0563488257228015,
    "timesteps": 12625200,
    "learntime": 0.27504719980061054,
    "sampletime": 20.596419513924047,
    "best_max_mean": -41.18066866787998,
    "best_max": -33.32254261363639
  },
  {
    "gen": 36,
    "reward_mean": -38.59375264485678,
    "reward_max": -33.34087239583333,
    "reward_min": -43.495213068181826,
    "reward_std": 2.368468898959729,
    "timesteps": 12985920,
    "learntime": 0.2992323499638587,
    "sampletime": 20.567579622846097,
    "best_max_mean": -41.18066866787998,
    "best_max": -33.32254261363639
  },
  {
    "gen": 37,
    "reward_mean": -37.90924351547703,
    "reward_max": -32.31913352272726,
    "reward_min": -42.82409090909091,
    "reward_std": 2.492016289826199,
    "timesteps": 13346640,
    "learntime": 0.28019987884908915,
    "sampletime": 20.335463647032157,
    "best_max_mean": -37.90924351547703,
    "best_max": -32.31913352272726
  },
  {
    "gen": 38,
    "reward_mean": -35.31383208303741,
    "reward_max": -29.22335227272728,
    "reward_min": -40.72677556818183,
    "reward_std": 2.552413272019617,
    "timesteps": 13707360,
    "learntime": 0.30910125002264977,
    "sampletime": 19.858738879906014,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 39,
    "reward_mean": -37.46180806477865,
    "reward_max": -33.05268465909091,
    "reward_min": -42.88399147727273,
    "reward_std": 1.7563007628143414,
    "timesteps": 14068080,
    "learntime": 0.3061348448973149,
    "sampletime": 20.431729309028015,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 40,
    "reward_mean": -36.60543225837478,
    "reward_max": -31.351491477272734,
    "reward_min": -40.85876420454547,
    "reward_std": 1.8896991042854927,
    "timesteps": 14428800,
    "learntime": 0.2932160431519151,
    "sampletime": 20.246326590888202,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 41,
    "reward_mean": -36.51734524813567,
    "reward_max": -31.09005681818189,
    "reward_min": -40.63561079545456,
    "reward_std": 2.308475202108888,
    "timesteps": 14789520,
    "learntime": 0.2888882691040635,
    "sampletime": 20.300064651994035,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 42,
    "reward_mean": -35.96007257634944,
    "reward_max": -31.521463068181845,
    "reward_min": -42.305397727272705,
    "reward_std": 2.2867755308923727,
    "timesteps": 15150240,
    "learntime": 0.30559752183035016,
    "sampletime": 20.4048953759484,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 43,
    "reward_mean": -38.42820630622634,
    "reward_max": -34.31258522727274,
    "reward_min": -41.76240056818183,
    "reward_std": 1.7591378375206412,
    "timesteps": 15510960,
    "learntime": 0.298884489107877,
    "sampletime": 20.152611311990768,
    "best_max_mean": -35.31383208303741,
    "best_max": -29.22335227272728
  },
  {
    "gen": 44,
    "reward_mean": -34.10315766305635,
    "reward_max": -28.29571022727273,
    "reward_min": -39.06225852272728,
    "reward_std": 2.5648692341614816,
    "timesteps": 15871680,
    "learntime": 0.3062321441248059,
    "sampletime": 20.12723342096433,
    "best_max_mean": -34.10315766305635,
    "best_max": -28.29571022727273
  },
  {
    "gen": 45,
    "reward_mean": -33.97939503062855,
    "reward_max": -28.187883522727248,
    "reward_min": -38.98686079545455,
    "reward_std": 2.496234169017522,
    "timesteps": 16232400,
    "learntime": 0.3097844470757991,
    "sampletime": 20.37719956203364,
    "best_max_mean": -33.97939503062855,
    "best_max": -28.187883522727248
  },
  {
    "gen": 46,
    "reward_mean": -33.26717394279713,
    "reward_max": -26.01986979166669,
    "reward_min": -37.70914772727275,
    "reward_std": 2.4483993999045213,
    "timesteps": 16593120,
    "learntime": 0.297423732932657,
    "sampletime": 20.477023568935692,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 47,
    "reward_mean": -32.406082523230374,
    "reward_max": -26.669886363636383,
    "reward_min": -37.51232954545455,
    "reward_std": 2.5317971055761865,
    "timesteps": 16953840,
    "learntime": 0.2773179148789495,
    "sampletime": 19.946250359993428,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 48,
    "reward_mean": -32.90404968261721,
    "reward_max": -27.787855113636432,
    "reward_min": -38.590227272727276,
    "reward_std": 2.1869910538779678,
    "timesteps": 17314560,
    "learntime": 0.30895976396277547,
    "sampletime": 20.01169679593295,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 49,
    "reward_mean": -32.18060929731891,
    "reward_max": -26.065820312500023,
    "reward_min": -36.90268465909092,
    "reward_std": 2.4696120067760416,
    "timesteps": 17675280,
    "learntime": 0.28853863500989974,
    "sampletime": 19.792192975990474,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 50,
    "reward_mean": -36.80916920055044,
    "reward_max": -29.293763020833367,
    "reward_min": -42.2499005681818,
    "reward_std": 2.9550244281293705,
    "timesteps": 18036000,
    "learntime": 0.2774068901780993,
    "sampletime": 20.2205647691153,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 51,
    "reward_mean": -35.03869832356773,
    "reward_max": -30.15811079545455,
    "reward_min": -39.60819010416671,
    "reward_std": 2.0957932384390956,
    "timesteps": 18396720,
    "learntime": 0.2757884890306741,
    "sampletime": 20.478221155004576,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 52,
    "reward_mean": -35.257399717388765,
    "reward_max": -27.456321022727295,
    "reward_min": -41.17930397727278,
    "reward_std": 2.8462927400049414,
    "timesteps": 18757440,
    "learntime": 0.30275348108261824,
    "sampletime": 20.02594033605419,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 53,
    "reward_mean": -32.904585219874555,
    "reward_max": -26.476420454545462,
    "reward_min": -39.0969460227273,
    "reward_std": 2.8934202902443,
    "timesteps": 19118160,
    "learntime": 0.31212720298208296,
    "sampletime": 19.86833711597137,
    "best_max_mean": -33.26717394279713,
    "best_max": -26.01986979166669
  },
  {
    "gen": 54,
    "reward_mean": -31.602485518022036,
    "reward_max": -21.856979166666687,
    "reward_min": -40.00528409090909,
    "reward_std": 3.3798585754336203,
    "timesteps": 19478880,
    "learntime": 0.2984396549873054,
    "sampletime": 20.383645958965644,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 55,
    "reward_mean": -33.45252110336771,
    "reward_max": -24.89563920454548,
    "reward_min": -40.21434659090911,
    "reward_std": 2.6599466058783374,
    "timesteps": 19839600,
    "learntime": 0.2977248909883201,
    "sampletime": 19.807800204027444,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 56,
    "reward_mean": -30.627278405391845,
    "reward_max": -25.4858238636364,
    "reward_min": -35.54133522727279,
    "reward_std": 2.534365611337338,
    "timesteps": 20200320,
    "learntime": 0.28067698096856475,
    "sampletime": 19.884007818065584,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 57,
    "reward_mean": -31.90036536014444,
    "reward_max": -23.191903409090926,
    "reward_min": -37.24558238636366,
    "reward_std": 2.9262920138500252,
    "timesteps": 20561040,
    "learntime": 0.2697190521284938,
    "sampletime": 19.87676222110167,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 58,
    "reward_mean": -30.222018118193684,
    "reward_max": -23.4487109375,
    "reward_min": -35.83117897727274,
    "reward_std": 2.6660119036623997,
    "timesteps": 20921760,
    "learntime": 0.31182922003790736,
    "sampletime": 19.978427448077127,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 59,
    "reward_mean": -31.476011167584076,
    "reward_max": -26.949401041666718,
    "reward_min": -35.70546875000005,
    "reward_std": 1.967144503948941,
    "timesteps": 21282480,
    "learntime": 0.2685441239736974,
    "sampletime": 19.715087469900027,
    "best_max_mean": -31.602485518022036,
    "best_max": -21.856979166666687
  },
  {
    "gen": 60,
    "reward_mean": -28.86086780894891,
    "reward_max": -20.602769886363664,
    "reward_min": -36.099908854166756,
    "reward_std": 3.1933560390180644,
    "timesteps": 21643200,
    "learntime": 0.29738840693607926,
    "sampletime": 19.34220671793446,
    "best_max_mean": -28.86086780894891,
    "best_max": -20.602769886363664
  },
  {
    "gen": 61,
    "reward_mean": -31.43188903808597,
    "reward_max": -26.341548295454576,
    "reward_min": -37.46998697916669,
    "reward_std": 2.920287907758118,
    "timesteps": 22003920,
    "learntime": 0.2992866919375956,
    "sampletime": 19.616715349955484,
    "best_max_mean": -28.86086780894891,
    "best_max": -20.602769886363664
  },
  {
    "gen": 62,
    "reward_mean": -32.385587953509756,
    "reward_max": -24.822897727272746,
    "reward_min": -37.786432291666735,
    "reward_std": 2.7861591351913524,
    "timesteps": 22364640,
    "learntime": 0.2881356899160892,
    "sampletime": 19.949034406105056,
    "best_max_mean": -28.86086780894891,
    "best_max": -20.602769886363664
  },
  {
    "gen": 63,
    "reward_mean": -32.047205588600875,
    "reward_max": -26.050820312500033,
    "reward_min": -38.4414453125,
    "reward_std": 2.3461022225639336,
    "timesteps": 22725360,
    "learntime": 0.2787969259079546,
    "sampletime": 19.83608095999807,
    "best_max_mean": -28.86086780894891,
    "best_max": -20.602769886363664
  },
  {
    "gen": 64,
    "reward_mean": -31.460273252545036,
    "reward_max": -24.51177556818186,
    "reward_min": -38.45701822916674,
    "reward_std": 2.6207081742588305,
    "timesteps": 23086080,
    "learntime": 0.3137074939440936,
    "sampletime": 19.62930061505176,
    "best_max_mean": -28.86086780894891,
    "best_max": -20.602769886363664
  },
  {
    "gen": 65,
    "reward_mean": -28.210081528172385,
    "reward_max": -20.591974431818183,
    "reward_min": -33.582343750000035,
    "reward_std": 2.345627682513926,
    "timesteps": 23446800,
    "learntime": 0.2859445142094046,
    "sampletime": 19.89894314482808,
    "best_max_mean": -28.210081528172385,
    "best_max": -20.591974431818183
  },
  {
    "gen": 66,
    "reward_mean": -27.29575820460467,
    "reward_max": -22.18974431818182,
    "reward_min": -33.17313920454547,
    "reward_std": 2.4440491611522703,
    "timesteps": 23807520,
    "learntime": 0.28924835100769997,
    "sampletime": 19.4856019760482,
    "best_max_mean": -28.210081528172385,
    "best_max": -20.591974431818183
  },
  {
    "gen": 67,
    "reward_mean": -29.241499374852097,
    "reward_max": -23.77109375000007,
    "reward_min": -33.15870738636368,
    "reward_std": 2.183246188303811,
    "timesteps": 24168240,
    "learntime": 0.28733316087163985,
    "sampletime": 19.760582567891106,
    "best_max_mean": -28.210081528172385,
    "best_max": -20.591974431818183
  },
  {
    "gen": 68,
    "reward_mean": -26.663784031723527,
    "reward_max": -20.98907552083335,
    "reward_min": -34.69677083333336,
    "reward_std": 2.966907540132063,
    "timesteps": 24528960,
    "learntime": 0.2823856049217284,
    "sampletime": 19.301611131988466,
    "best_max_mean": -28.210081528172385,
    "best_max": -20.591974431818183
  },
  {
    "gen": 69,
    "reward_mean": -24.286578887014713,
    "reward_max": -16.452713068181826,
    "reward_min": -29.02173295454553,
    "reward_std": 2.3902498610689773,
    "timesteps": 24889680,
    "learntime": 0.28750259918160737,
    "sampletime": 19.34106424008496,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 70,
    "reward_mean": -24.76611979166671,
    "reward_max": -16.851548295454577,
    "reward_min": -30.508465909091,
    "reward_std": 3.3757520140315154,
    "timesteps": 25250400,
    "learntime": 0.30157063412480056,
    "sampletime": 19.272753125987947,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 71,
    "reward_mean": -25.086960726651306,
    "reward_max": -17.93934895833335,
    "reward_min": -32.17600852272729,
    "reward_std": 3.319808131724265,
    "timesteps": 25611120,
    "learntime": 0.29613157408311963,
    "sampletime": 19.796378226019442,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 72,
    "reward_mean": -28.31245433460586,
    "reward_max": -19.017130681818184,
    "reward_min": -35.20958806818183,
    "reward_std": 2.8475030197146998,
    "timesteps": 25971840,
    "learntime": 0.28621033602394164,
    "sampletime": 19.48836191603914,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 73,
    "reward_mean": -29.82295868844703,
    "reward_max": -20.763320312500053,
    "reward_min": -38.60088068181823,
    "reward_std": 3.4103637252773757,
    "timesteps": 26332560,
    "learntime": 0.2814822760410607,
    "sampletime": 19.75250741513446,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 74,
    "reward_mean": -31.15480759129386,
    "reward_max": -25.675260416666717,
    "reward_min": -38.184232954545514,
    "reward_std": 2.645502680734453,
    "timesteps": 26693280,
    "learntime": 0.2920819001737982,
    "sampletime": 19.749563456047326,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 75,
    "reward_mean": -29.91538818359381,
    "reward_max": -24.06568181818184,
    "reward_min": -36.06228693181825,
    "reward_std": 2.594664683952855,
    "timesteps": 27054000,
    "learntime": 0.2823547809384763,
    "sampletime": 19.740234188036993,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 76,
    "reward_mean": -26.178573441938966,
    "reward_max": -21.21497395833337,
    "reward_min": -30.710028409090953,
    "reward_std": 2.076027479072398,
    "timesteps": 27414720,
    "learntime": 0.28934513917192817,
    "sampletime": 19.316252124030143,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 77,
    "reward_mean": -27.905260250207213,
    "reward_max": -21.813622159090965,
    "reward_min": -35.05098958333346,
    "reward_std": 2.7392929149148335,
    "timesteps": 27775440,
    "learntime": 0.318270456045866,
    "sampletime": 19.527246922953054,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 78,
    "reward_mean": -28.954065884676915,
    "reward_max": -21.057059659090964,
    "reward_min": -37.088593750000086,
    "reward_std": 3.026124810879625,
    "timesteps": 28136160,
    "learntime": 0.3066179188899696,
    "sampletime": 19.478093444835395,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 79,
    "reward_mean": -28.125555771336465,
    "reward_max": -18.226846590909133,
    "reward_min": -33.803053977272775,
    "reward_std": 2.8021694346713186,
    "timesteps": 28496880,
    "learntime": 0.29753295006230474,
    "sampletime": 19.712190184975043,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 80,
    "reward_mean": -26.129757024591683,
    "reward_max": -19.78927556818185,
    "reward_min": -31.140170454545554,
    "reward_std": 2.480935664717303,
    "timesteps": 28857600,
    "learntime": 0.318327713990584,
    "sampletime": 19.528198933927342,
    "best_max_mean": -24.286578887014713,
    "best_max": -16.452713068181826
  },
  {
    "gen": 81,
    "reward_mean": -24.796321540601372,
    "reward_max": -14.278920454545453,
    "reward_min": -34.890738636363764,
    "reward_std": 4.095325117236833,
    "timesteps": 29218320,
    "learntime": 0.29244309081695974,
    "sampletime": 19.10568408994004,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 82,
    "reward_mean": -28.086604873194915,
    "reward_max": -21.84936079545458,
    "reward_min": -33.74330965909103,
    "reward_std": 2.653330725707046,
    "timesteps": 29579040,
    "learntime": 0.3028264711610973,
    "sampletime": 19.502827011980116,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 83,
    "reward_mean": -26.727555578983242,
    "reward_max": -16.867940340909133,
    "reward_min": -35.58811079545465,
    "reward_std": 3.8043123024756196,
    "timesteps": 29939760,
    "learntime": 0.2917944260407239,
    "sampletime": 19.617543433094397,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 84,
    "reward_mean": -24.790429835464053,
    "reward_max": -14.94759943181818,
    "reward_min": -32.2674857954546,
    "reward_std": 2.9054131924230537,
    "timesteps": 30300480,
    "learntime": 0.3017005859874189,
    "sampletime": 19.375746475998312,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 85,
    "reward_mean": -23.294662845496024,
    "reward_max": -15.494829545454548,
    "reward_min": -30.24622159090917,
    "reward_std": 2.8754017219233763,
    "timesteps": 30661200,
    "learntime": 0.29661528393626213,
    "sampletime": 19.190223451936617,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 86,
    "reward_mean": -26.247341290098305,
    "reward_max": -19.275625000000037,
    "reward_min": -32.03410511363642,
    "reward_std": 2.8920622510297047,
    "timesteps": 31021920,
    "learntime": 0.28233229205943644,
    "sampletime": 19.23214190802537,
    "best_max_mean": -24.796321540601372,
    "best_max": -14.278920454545453
  },
  {
    "gen": 87,
    "reward_mean": -19.025796823212623,
    "reward_max": -11.977286931818169,
    "reward_min": -27.611164772727328,
    "reward_std": 3.3686147078935655,
    "timesteps": 31382640,
    "learntime": 0.2684711429756135,
    "sampletime": 18.96625022799708,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 88,
    "reward_mean": -24.93147128018471,
    "reward_max": -18.8033854166667,
    "reward_min": -32.481647727272836,
    "reward_std": 2.7691331892525146,
    "timesteps": 31743360,
    "learntime": 0.30952973011881113,
    "sampletime": 19.294533159816638,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 89,
    "reward_mean": -23.641835974491052,
    "reward_max": -16.817571022727282,
    "reward_min": -31.85774147727284,
    "reward_std": 2.6812669267954483,
    "timesteps": 32104080,
    "learntime": 0.2736738750245422,
    "sampletime": 19.33252345584333,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 90,
    "reward_mean": -27.70896654533625,
    "reward_max": -16.828437500000028,
    "reward_min": -35.449971590909236,
    "reward_std": 3.8667829194294865,
    "timesteps": 32464800,
    "learntime": 0.1760760168544948,
    "sampletime": 19.674250239972025,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 91,
    "reward_mean": -27.848993141867968,
    "reward_max": -22.9367045454546,
    "reward_min": -33.504687500000074,
    "reward_std": 2.500840528738439,
    "timesteps": 32825520,
    "learntime": 0.1893710228614509,
    "sampletime": 19.387265847995877,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 92,
    "reward_mean": -22.917898134173825,
    "reward_max": -14.760980113636355,
    "reward_min": -29.24059659090917,
    "reward_std": 3.2340110055148004,
    "timesteps": 33186240,
    "learntime": 0.1890020731370896,
    "sampletime": 19.090225832071155,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 93,
    "reward_mean": -25.419813750295987,
    "reward_max": -14.235525568181822,
    "reward_min": -32.42528409090921,
    "reward_std": 3.2348370595476856,
    "timesteps": 33546960,
    "learntime": 0.28262782096862793,
    "sampletime": 19.251294646179304,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 94,
    "reward_mean": -26.347626120827464,
    "reward_max": -18.68883522727276,
    "reward_min": -35.44412760416676,
    "reward_std": 3.2388797824306508,
    "timesteps": 33907680,
    "learntime": 0.29551613912917674,
    "sampletime": 19.601243081036955,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 95,
    "reward_mean": -24.34426979758527,
    "reward_max": -19.935965909090918,
    "reward_min": -28.98335227272736,
    "reward_std": 2.126916687940687,
    "timesteps": 34268400,
    "learntime": 0.19046055781655014,
    "sampletime": 19.42654094705358,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 96,
    "reward_mean": -24.27004183682534,
    "reward_max": -17.194257812500023,
    "reward_min": -29.822713068181887,
    "reward_std": 2.3379250293055183,
    "timesteps": 34629120,
    "learntime": 0.18883580015972257,
    "sampletime": 19.375679075019434,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 97,
    "reward_mean": -24.840522405451054,
    "reward_max": -19.991576704545505,
    "reward_min": -29.00605113636368,
    "reward_std": 2.050061366732814,
    "timesteps": 34989840,
    "learntime": 0.28033951204270124,
    "sampletime": 19.37195945996791,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 98,
    "reward_mean": -26.79868476636488,
    "reward_max": -20.605028409090945,
    "reward_min": -33.44589488636375,
    "reward_std": 2.715131552004558,
    "timesteps": 35350560,
    "learntime": 0.20054450095631182,
    "sampletime": 19.86589926900342,
    "best_max_mean": -19.025796823212623,
    "best_max": -11.977286931818169
  },
  {
    "gen": 99,
    "reward_mean": -17.845177260890168,
    "reward_max": -10.095752840909073,
    "reward_min": -24.220781250000048,
    "reward_std": 2.9767602281665853,
    "timesteps": 35711280,
    "learntime": 0.30239679710939527,
    "sampletime": 19.05824142601341,
    "best_max_mean": -17.845177260890168,
    "best_max": -10.095752840909073
  },
  {
    "gen": 100,
    "reward_mean": -21.48048546993375,
    "reward_max": -12.030965909090918,
    "reward_min": -30.185582386363684,
    "reward_std": 3.2420674764176702,
    "timesteps": 36072000,
    "learntime": 0.20405799290165305,
    "sampletime": 19.275725577957928,
    "best_max_mean": -17.845177260890168,
    "best_max": -10.095752840909073
  },
  {
    "gen": 101,
    "reward_mean": -21.39909925056231,
    "reward_max": -10.000156250000035,
    "reward_min": -29.34795454545463,
    "reward_std": 3.9220087610754577,
    "timesteps": 36432720,
    "learntime": 0.28064014995470643,
    "sampletime": 19.356462633004412,
    "best_max_mean": -21.39909925056231,
    "best_max": -10.000156250000035
  },
  {
    "gen": 102,
    "reward_mean": -22.043766091086702,
    "reward_max": -12.720482954545485,
    "reward_min": -30.83800781250008,
    "reward_std": 2.9136949373143777,
    "timesteps": 36793440,
    "learntime": 0.20402154396288097,
    "sampletime": 19.353721254039556,
    "best_max_mean": -21.39909925056231,
    "best_max": -10.000156250000035
  },
  {
    "gen": 103,
    "reward_mean": -21.20478637695316,
    "reward_max": -10.867102272727267,
    "reward_min": -26.554588068181843,
    "reward_std": 2.8694468916500147,
    "timesteps": 37154160,
    "learntime": 0.20695750787854195,
    "sampletime": 19.31670145317912,
    "best_max_mean": -21.39909925056231,
    "best_max": -10.000156250000035
  },
  {
    "gen": 104,
    "reward_mean": -17.886291873816326,
    "reward_max": -9.010143229166678,
    "reward_min": -25.69977272727281,
    "reward_std": 3.552040159694986,
    "timesteps": 37514880,
    "learntime": 0.1966520978603512,
    "sampletime": 19.168466767994687,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 105,
    "reward_mean": -21.11743731874411,
    "reward_max": -15.003480113636387,
    "reward_min": -28.74623697916671,
    "reward_std": 3.314481672430763,
    "timesteps": 37875600,
    "learntime": 0.19154456700198352,
    "sampletime": 19.28347640717402,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 106,
    "reward_mean": -20.49088319720648,
    "reward_max": -12.899247159090937,
    "reward_min": -26.52298295454551,
    "reward_std": 2.781534477430204,
    "timesteps": 38236320,
    "learntime": 0.19256330793723464,
    "sampletime": 19.066499158972874,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 107,
    "reward_mean": -19.050466012665737,
    "reward_max": -11.64254261363635,
    "reward_min": -26.634140625000043,
    "reward_std": 2.8641425770536326,
    "timesteps": 38597040,
    "learntime": 0.19961480796337128,
    "sampletime": 19.28832022100687,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 108,
    "reward_mean": -21.50602441036346,
    "reward_max": -15.305468750000024,
    "reward_min": -27.31110795454558,
    "reward_std": 2.7985103390445576,
    "timesteps": 38957760,
    "learntime": 0.17813134007155895,
    "sampletime": 19.342507716966793,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 109,
    "reward_mean": -22.868884776722354,
    "reward_max": -15.595397727272712,
    "reward_min": -28.18598011363646,
    "reward_std": 2.6028482064625407,
    "timesteps": 39318480,
    "learntime": 0.18040645401924849,
    "sampletime": 19.187375439796597,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 110,
    "reward_mean": -21.285558952562774,
    "reward_max": -15.211931818181817,
    "reward_min": -27.5681250000001,
    "reward_std": 2.5127438572293035,
    "timesteps": 39679200,
    "learntime": 0.19196678791195154,
    "sampletime": 19.365948293125257,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 111,
    "reward_mean": -22.11576075698396,
    "reward_max": -16.03833806818187,
    "reward_min": -28.907301136363746,
    "reward_std": 2.760628128909958,
    "timesteps": 40039920,
    "learntime": 0.19286396983079612,
    "sampletime": 19.142151166917756,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 112,
    "reward_mean": -23.582958355527985,
    "reward_max": -18.317005208333352,
    "reward_min": -29.483039772727377,
    "reward_std": 2.4261018229961278,
    "timesteps": 40400640,
    "learntime": 0.18822575104422867,
    "sampletime": 19.41390497982502,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 113,
    "reward_mean": -18.25357420025452,
    "reward_max": -11.870894886363637,
    "reward_min": -24.860852272727296,
    "reward_std": 2.7816056659042476,
    "timesteps": 40761360,
    "learntime": 0.1918634958565235,
    "sampletime": 19.15959963784553,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 114,
    "reward_mean": -18.59707125577062,
    "reward_max": -11.239127604166667,
    "reward_min": -26.361207386363716,
    "reward_std": 3.1607148547275843,
    "timesteps": 41122080,
    "learntime": 0.18915562494657934,
    "sampletime": 18.967367065139115,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 115,
    "reward_mean": -21.752533606326985,
    "reward_max": -16.122798295454533,
    "reward_min": -26.78262784090917,
    "reward_std": 2.4453172614790484,
    "timesteps": 41482800,
    "learntime": 0.19546520081348717,
    "sampletime": 19.190415264107287,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 116,
    "reward_mean": -20.769931215228503,
    "reward_max": -13.648776041666665,
    "reward_min": -26.070696022727308,
    "reward_std": 2.7937959745865277,
    "timesteps": 41843520,
    "learntime": 0.19409392308443785,
    "sampletime": 19.24333015899174,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 117,
    "reward_mean": -24.794726229581023,
    "reward_max": -18.39730468750001,
    "reward_min": -30.19017045454557,
    "reward_std": 3.044703288292833,
    "timesteps": 42204240,
    "learntime": 0.19184955209493637,
    "sampletime": 19.308214735938236,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 118,
    "reward_mean": -21.291194624467366,
    "reward_max": -15.496818181818197,
    "reward_min": -28.725653409090977,
    "reward_std": 2.7424494733103693,
    "timesteps": 42564960,
    "learntime": 0.18409440689720213,
    "sampletime": 19.390221090987325,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 119,
    "reward_mean": -18.364125532670464,
    "reward_max": -13.303281249999998,
    "reward_min": -24.23002604166669,
    "reward_std": 2.8699570500656173,
    "timesteps": 42925680,
    "learntime": 0.1818418928887695,
    "sampletime": 18.983078884892166,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 120,
    "reward_mean": -19.15504307602393,
    "reward_max": -11.26884943181817,
    "reward_min": -25.977514204545482,
    "reward_std": 2.8752834245919847,
    "timesteps": 43286400,
    "learntime": 0.19596627494320273,
    "sampletime": 19.30301185301505,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 121,
    "reward_mean": -20.17150816021548,
    "reward_max": -11.816079545454606,
    "reward_min": -29.109257812500093,
    "reward_std": 3.1977815368089915,
    "timesteps": 43647120,
    "learntime": 0.20592386508360505,
    "sampletime": 19.105570896994323,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 122,
    "reward_mean": -20.72944263805047,
    "reward_max": -15.397812500000027,
    "reward_min": -27.917457386363743,
    "reward_std": 2.3568279130619163,
    "timesteps": 44007840,
    "learntime": 0.1880221718456596,
    "sampletime": 19.093804251868278,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 123,
    "reward_mean": -18.09180277506512,
    "reward_max": -10.352201704545434,
    "reward_min": -26.312528409090977,
    "reward_std": 3.339373835983942,
    "timesteps": 44368560,
    "learntime": 0.2026455500163138,
    "sampletime": 19.15011384896934,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 124,
    "reward_mean": -17.730876908735823,
    "reward_max": -9.213828125000072,
    "reward_min": -25.206335227272803,
    "reward_std": 3.0861014669455704,
    "timesteps": 44729280,
    "learntime": 0.18580470280721784,
    "sampletime": 18.948416315950453,
    "best_max_mean": -17.886291873816326,
    "best_max": -9.010143229166678
  },
  {
    "gen": 125,
    "reward_mean": -18.813156904740787,
    "reward_max": -8.088551136363636,
    "reward_min": -27.468906250000057,
    "reward_std": 3.9372977726039475,
    "timesteps": 45090000,
    "learntime": 0.20113848708570004,
    "sampletime": 19.03389728302136,
    "best_max_mean": -18.813156904740787,
    "best_max": -8.088551136363636
  },
  {
    "gen": 126,
    "reward_mean": -15.920267833362935,
    "reward_max": -5.618835227272794,
    "reward_min": -24.845411931818216,
    "reward_std": 3.419016363734353,
    "timesteps": 45450720,
    "learntime": 0.18441157112829387,
    "sampletime": 19.062989428872243,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 127,
    "reward_mean": -20.459088745117235,
    "reward_max": -11.69757102272727,
    "reward_min": -28.89308238636377,
    "reward_std": 3.6339114935683936,
    "timesteps": 45811440,
    "learntime": 0.19845142401754856,
    "sampletime": 19.354889736976475,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 128,
    "reward_mean": -19.429162505178777,
    "reward_max": -12.220142045454558,
    "reward_min": -29.57112215909103,
    "reward_std": 3.7460590678196097,
    "timesteps": 46172160,
    "learntime": 0.17881443188525736,
    "sampletime": 19.149753476958722,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 129,
    "reward_mean": -19.969651859167882,
    "reward_max": -11.666150568181818,
    "reward_min": -26.58723011363642,
    "reward_std": 3.5014999525997306,
    "timesteps": 46532880,
    "learntime": 0.17906540189869702,
    "sampletime": 19.19002422806807,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 130,
    "reward_mean": -16.593897594105137,
    "reward_max": -7.460533854166663,
    "reward_min": -26.674928977272803,
    "reward_std": 3.6417714622584385,
    "timesteps": 46893600,
    "learntime": 0.19212952186353505,
    "sampletime": 19.28192541678436,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 131,
    "reward_mean": -15.383221028645858,
    "reward_max": -5.74585227272728,
    "reward_min": -21.020170454545504,
    "reward_std": 2.9631453885974666,
    "timesteps": 47254320,
    "learntime": 0.18726768414489925,
    "sampletime": 19.246733812149614,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 132,
    "reward_mean": -21.930399743282482,
    "reward_max": -16.081974431818207,
    "reward_min": -27.420909090909188,
    "reward_std": 2.545013438706101,
    "timesteps": 47615040,
    "learntime": 0.1808834259863943,
    "sampletime": 19.473874300019816,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 133,
    "reward_mean": -18.146843890565847,
    "reward_max": -9.95857954545457,
    "reward_min": -24.290767045454594,
    "reward_std": 3.095018373434094,
    "timesteps": 47975760,
    "learntime": 0.18120395694859326,
    "sampletime": 19.029762726044282,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 134,
    "reward_mean": -20.58795678341032,
    "reward_max": -13.575411931818188,
    "reward_min": -27.765247395833438,
    "reward_std": 3.203793932446369,
    "timesteps": 48336480,
    "learntime": 0.1944520811084658,
    "sampletime": 19.11161598796025,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 135,
    "reward_mean": -19.641213970762344,
    "reward_max": -11.511633522727244,
    "reward_min": -27.606250000000113,
    "reward_std": 3.1055413213420096,
    "timesteps": 48697200,
    "learntime": 0.1941351848654449,
    "sampletime": 18.973486496135592,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 136,
    "reward_mean": -17.847811945134964,
    "reward_max": -9.892301136363615,
    "reward_min": -23.44937500000006,
    "reward_std": 3.0968084147394155,
    "timesteps": 49057920,
    "learntime": 0.17774972296319902,
    "sampletime": 19.08231278997846,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 137,
    "reward_mean": -18.46340344978104,
    "reward_max": -9.117826704545424,
    "reward_min": -30.429502840909198,
    "reward_std": 3.7379047724920764,
    "timesteps": 49418640,
    "learntime": 0.1901049700099975,
    "sampletime": 19.18492282414809,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 138,
    "reward_mean": -18.29380010431465,
    "reward_max": -11.658721590909074,
    "reward_min": -24.200681818181863,
    "reward_std": 2.572162404367288,
    "timesteps": 49779360,
    "learntime": 0.19440121296793222,
    "sampletime": 19.3355342799332,
    "best_max_mean": -15.920267833362935,
    "best_max": -5.618835227272794
  },
  {
    "gen": 139,
    "reward_mean": -16.575226181492685,
    "reward_max": -3.5902272727272617,
    "reward_min": -27.08072443181827,
    "reward_std": 4.013435487008679,
    "timesteps": 50140080,
    "learntime": 0.17543694586493075,
    "sampletime": 19.092386010102928,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 140,
    "reward_mean": -13.947864527846843,
    "reward_max": -6.232642045454553,
    "reward_min": -21.16226562500005,
    "reward_std": 3.542628349700303,
    "timesteps": 50500800,
    "learntime": 0.19123980007134378,
    "sampletime": 18.791881007840857,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 141,
    "reward_mean": -16.53033828272966,
    "reward_max": -10.611448863636376,
    "reward_min": -25.30074218750008,
    "reward_std": 2.7779494180297095,
    "timesteps": 50861520,
    "learntime": 0.17968626017682254,
    "sampletime": 19.1959363988135,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 142,
    "reward_mean": -16.76208296342332,
    "reward_max": -9.238693181818181,
    "reward_min": -23.521079545454562,
    "reward_std": 3.078080367074111,
    "timesteps": 51222240,
    "learntime": 0.1701535249594599,
    "sampletime": 19.262678997125477,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 143,
    "reward_mean": -17.683490582090453,
    "reward_max": -9.352226562500025,
    "reward_min": -24.716789772727306,
    "reward_std": 3.3259812995737748,
    "timesteps": 51582960,
    "learntime": 0.20077195903286338,
    "sampletime": 19.066600560909137,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 144,
    "reward_mean": -14.632274928237461,
    "reward_max": -4.9441619318181775,
    "reward_min": -22.6810085227273,
    "reward_std": 3.6603738930378866,
    "timesteps": 51943680,
    "learntime": 0.19683916913345456,
    "sampletime": 19.347009822027758,
    "best_max_mean": -16.575226181492685,
    "best_max": -3.5902272727272617
  },
  {
    "gen": 145,
    "reward_mean": -9.11555741743608,
    "reward_max": -0.9631510416666788,
    "reward_min": -20.164900568181892,
    "reward_std": 4.121022821482347,
    "timesteps": 52304400,
    "learntime": 0.1896460319403559,
    "sampletime": 18.65162267605774,
    "best_max_mean": -9.11555741743608,
    "best_max": -0.9631510416666788
  },
  {
    "gen": 146,
    "reward_mean": -11.576484356504505,
    "reward_max": 2.6413068181818162,
    "reward_min": -18.476278409090927,
    "reward_std": 3.750636578197613,
    "timesteps": 52665120,
    "learntime": 0.18380691995844245,
    "sampletime": 19.045278331963345,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 147,
    "reward_mean": -18.307743955670013,
    "reward_max": -12.175852272727257,
    "reward_min": -26.126747159091,
    "reward_std": 3.4033410606702987,
    "timesteps": 53025840,
    "learntime": 0.17856265511363745,
    "sampletime": 19.178143020020798,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 148,
    "reward_mean": -15.957042365796651,
    "reward_max": -8.85632102272725,
    "reward_min": -22.43023437500003,
    "reward_std": 2.7585511175791795,
    "timesteps": 53386560,
    "learntime": 0.18930935813114047,
    "sampletime": 19.04893981316127,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 149,
    "reward_mean": -19.75604989716505,
    "reward_max": -13.851022727272708,
    "reward_min": -25.50454545454555,
    "reward_std": 2.87243501118152,
    "timesteps": 53747280,
    "learntime": 0.18835225980728865,
    "sampletime": 19.11232348298654,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 150,
    "reward_mean": -16.510640018347573,
    "reward_max": -7.552265625000035,
    "reward_min": -25.146732954545552,
    "reward_std": 3.681110861731733,
    "timesteps": 54108000,
    "learntime": 0.19436017610132694,
    "sampletime": 18.905649117892608,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 151,
    "reward_mean": -11.126567493785508,
    "reward_max": -2.994815340909065,
    "reward_min": -19.988632812500043,
    "reward_std": 3.9731538554841523,
    "timesteps": 54468720,
    "learntime": 0.18088788213208318,
    "sampletime": 19.174238718114793,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 152,
    "reward_mean": -14.426642678000722,
    "reward_max": -5.261235795454542,
    "reward_min": -21.173764204545467,
    "reward_std": 3.2128214983983603,
    "timesteps": 54829440,
    "learntime": 0.19671289599500597,
    "sampletime": 18.887168538058177,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 153,
    "reward_mean": -19.573461303710985,
    "reward_max": -9.184659090909095,
    "reward_min": -30.18656250000011,
    "reward_std": 3.8141677283043394,
    "timesteps": 55190160,
    "learntime": 0.19312766985967755,
    "sampletime": 19.13323577004485,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 154,
    "reward_mean": -15.411498819987,
    "reward_max": -8.392755681818182,
    "reward_min": -24.06447443181827,
    "reward_std": 3.4556431790470334,
    "timesteps": 55550880,
    "learntime": 0.1804558769799769,
    "sampletime": 18.869511392898858,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 155,
    "reward_mean": -13.78047516793918,
    "reward_max": -5.3292329545454855,
    "reward_min": -24.21686197916677,
    "reward_std": 3.6378879122658407,
    "timesteps": 55911600,
    "learntime": 0.18375063803978264,
    "sampletime": 18.79421133804135,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 156,
    "reward_mean": -18.193756195993167,
    "reward_max": -10.615553977272732,
    "reward_min": -25.738528645833394,
    "reward_std": 3.279309332915721,
    "timesteps": 56272320,
    "learntime": 0.1888401210308075,
    "sampletime": 19.063221846008673,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 157,
    "reward_mean": -17.279549042672848,
    "reward_max": -10.202187500000006,
    "reward_min": -26.501590909091036,
    "reward_std": 3.2156707187084956,
    "timesteps": 56633040,
    "learntime": 0.18556169187650084,
    "sampletime": 19.165213574189693,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 158,
    "reward_mean": -11.238218716708094,
    "reward_max": -4.294296874999987,
    "reward_min": -18.6505681818182,
    "reward_std": 3.2464787277600857,
    "timesteps": 56993760,
    "learntime": 0.19719820702448487,
    "sampletime": 18.67696761689149,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 159,
    "reward_mean": -9.889659201882104,
    "reward_max": -0.5051278409090659,
    "reward_min": -18.744076704545538,
    "reward_std": 4.166148365452034,
    "timesteps": 57354480,
    "learntime": 0.20083895605057478,
    "sampletime": 18.83992429706268,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 160,
    "reward_mean": -17.319754527698883,
    "reward_max": -7.999133522727259,
    "reward_min": -24.28002840909094,
    "reward_std": 2.8935585035149196,
    "timesteps": 57715200,
    "learntime": 0.1974300011061132,
    "sampletime": 19.037215953925624,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 161,
    "reward_mean": -16.885104296135193,
    "reward_max": -11.262187499999994,
    "reward_min": -22.797382812500043,
    "reward_std": 2.8388189352159405,
    "timesteps": 58075920,
    "learntime": 0.1812616589013487,
    "sampletime": 19.382105085998774,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 162,
    "reward_mean": -15.45308029637193,
    "reward_max": -8.50946614583331,
    "reward_min": -23.228622159090936,
    "reward_std": 2.8531962346714024,
    "timesteps": 58436640,
    "learntime": 0.18840818805620074,
    "sampletime": 18.96261392789893,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 163,
    "reward_mean": -13.644386374733678,
    "reward_max": -7.5667968749999615,
    "reward_min": -22.898821022727358,
    "reward_std": 3.253244474323469,
    "timesteps": 58797360,
    "learntime": 0.19067549798637629,
    "sampletime": 18.813697195146233,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 164,
    "reward_mean": -15.863647128018489,
    "reward_max": -3.605085227272697,
    "reward_min": -22.82673295454548,
    "reward_std": 3.8770319605525767,
    "timesteps": 59158080,
    "learntime": 0.18739359104074538,
    "sampletime": 18.818052700953558,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 165,
    "reward_mean": -12.730939978397265,
    "reward_max": -5.373323863636363,
    "reward_min": -20.333098958333405,
    "reward_std": 3.4052974718552784,
    "timesteps": 59518800,
    "learntime": 0.1884758248925209,
    "sampletime": 18.796296671964228,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 166,
    "reward_mean": -12.456558708422124,
    "reward_max": -4.6818892045454366,
    "reward_min": -19.319403409090942,
    "reward_std": 3.1694283302320327,
    "timesteps": 59879520,
    "learntime": 0.18723012297414243,
    "sampletime": 18.63821293017827,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 167,
    "reward_mean": -14.617902721058275,
    "reward_max": -4.708465909090885,
    "reward_min": -23.34184659090923,
    "reward_std": 3.8347639095655235,
    "timesteps": 60240240,
    "learntime": 0.17340095690451562,
    "sampletime": 18.772343361051753,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 168,
    "reward_mean": -12.821376287286927,
    "reward_max": -6.693991477272715,
    "reward_min": -22.433224431818275,
    "reward_std": 2.9183416611487285,
    "timesteps": 60600960,
    "learntime": 0.1821746330242604,
    "sampletime": 18.700548351043835,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 169,
    "reward_mean": -12.98877330433239,
    "reward_max": -5.039947916666653,
    "reward_min": -21.40032670454548,
    "reward_std": 3.6789118972662416,
    "timesteps": 60961680,
    "learntime": 0.197598815895617,
    "sampletime": 18.94806258706376,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 170,
    "reward_mean": -17.178507486979193,
    "reward_max": -7.192585227272709,
    "reward_min": -22.892734375000064,
    "reward_std": 3.119192694770861,
    "timesteps": 61322400,
    "learntime": 0.18712253705598414,
    "sampletime": 18.904548479942605,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 171,
    "reward_mean": -13.931336244525351,
    "reward_max": -7.2732528409091,
    "reward_min": -22.746835937500055,
    "reward_std": 3.4042427476941364,
    "timesteps": 61683120,
    "learntime": 0.18949724291451275,
    "sampletime": 19.02649450302124,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 172,
    "reward_mean": -11.899853182705982,
    "reward_max": -1.3162760416666954,
    "reward_min": -18.769275568181857,
    "reward_std": 3.9690612872602755,
    "timesteps": 62043840,
    "learntime": 0.20100126997567713,
    "sampletime": 18.777613347163424,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 173,
    "reward_mean": -12.608364572236034,
    "reward_max": -4.716377840909087,
    "reward_min": -18.297317708333352,
    "reward_std": 3.0400527620465176,
    "timesteps": 62404560,
    "learntime": 0.18719583796337247,
    "sampletime": 18.892362505896017,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 174,
    "reward_mean": -15.23735198049837,
    "reward_max": -7.435255681818154,
    "reward_min": -24.04215909090917,
    "reward_std": 3.70206040435983,
    "timesteps": 62765280,
    "learntime": 0.18291708198376,
    "sampletime": 19.098376610083506,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 175,
    "reward_mean": -13.47864553740532,
    "reward_max": -4.454374999999994,
    "reward_min": -19.658242187500047,
    "reward_std": 3.166369742243351,
    "timesteps": 63126000,
    "learntime": 0.18747499282471836,
    "sampletime": 19.20931398193352,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 176,
    "reward_mean": -12.05093200683593,
    "reward_max": -7.315894886363597,
    "reward_min": -17.685696022727285,
    "reward_std": 2.2882351389977136,
    "timesteps": 63486720,
    "learntime": 0.19506262592040002,
    "sampletime": 18.89527761307545,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 177,
    "reward_mean": -12.575569661458331,
    "reward_max": -5.12113636363633,
    "reward_min": -19.695781250000035,
    "reward_std": 2.748323596631034,
    "timesteps": 63847440,
    "learntime": 0.18430737499147654,
    "sampletime": 18.681038926821202,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 178,
    "reward_mean": -13.951922903349903,
    "reward_max": -6.8692045454545045,
    "reward_min": -19.539545454545475,
    "reward_std": 2.596448727293136,
    "timesteps": 64208160,
    "learntime": 0.19590357900597155,
    "sampletime": 18.769136276096106,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 179,
    "reward_mean": -7.943537042791183,
    "reward_max": -0.8346306818181742,
    "reward_min": -16.877002840909103,
    "reward_std": 3.586216940592422,
    "timesteps": 64568880,
    "learntime": 0.18496028403751552,
    "sampletime": 18.575448971940205,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 180,
    "reward_mean": -11.548804191820548,
    "reward_max": -5.283977272727266,
    "reward_min": -17.36848011363641,
    "reward_std": 2.950557962422964,
    "timesteps": 64929600,
    "learntime": 0.16953176097013056,
    "sampletime": 18.747417092788965,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 181,
    "reward_mean": -10.29345329515862,
    "reward_max": -3.5274147727272545,
    "reward_min": -18.84338068181822,
    "reward_std": 3.699615901906676,
    "timesteps": 65290320,
    "learntime": 0.1938541131094098,
    "sampletime": 19.018694917904213,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 182,
    "reward_mean": -11.684274920839256,
    "reward_max": -4.3807102272726866,
    "reward_min": -18.244218750000037,
    "reward_std": 3.3870382444650793,
    "timesteps": 65651040,
    "learntime": 0.19008564809337258,
    "sampletime": 21.278611483983696,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 183,
    "reward_mean": -11.7574647660689,
    "reward_max": -4.427045454545445,
    "reward_min": -18.692571022727332,
    "reward_std": 3.566094778905968,
    "timesteps": 66011760,
    "learntime": 0.18657530611380935,
    "sampletime": 21.24023636803031,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 184,
    "reward_mean": -10.292928614760884,
    "reward_max": -4.403893229166648,
    "reward_min": -15.525014204545506,
    "reward_std": 2.6151809295909376,
    "timesteps": 66372480,
    "learntime": 0.19972324487753212,
    "sampletime": 24.264300614129752,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 185,
    "reward_mean": -11.567019024473257,
    "reward_max": -2.3601704545454605,
    "reward_min": -19.601901041666686,
    "reward_std": 3.4820866529896053,
    "timesteps": 66733200,
    "learntime": 0.1809561720583588,
    "sampletime": 20.384441274916753,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 186,
    "reward_mean": -8.300336377692943,
    "reward_max": -1.1141477272727298,
    "reward_min": -15.000454545454595,
    "reward_std": 3.481848114309173,
    "timesteps": 67093920,
    "learntime": 0.18720453092828393,
    "sampletime": 20.33372929203324,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 187,
    "reward_mean": -8.971254901308003,
    "reward_max": -0.3296306818182074,
    "reward_min": -15.892329545454556,
    "reward_std": 3.5708228157912156,
    "timesteps": 67454640,
    "learntime": 0.20340954093262553,
    "sampletime": 18.756192032946274,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 188,
    "reward_mean": -10.831674490263968,
    "reward_max": -3.574140624999991,
    "reward_min": -21.501264204545503,
    "reward_std": 3.474200567332697,
    "timesteps": 67815360,
    "learntime": 0.1850881848949939,
    "sampletime": 18.976553736953065,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 189,
    "reward_mean": -16.091643343838815,
    "reward_max": -9.19921874999997,
    "reward_min": -25.492443181818295,
    "reward_std": 3.4028030955219375,
    "timesteps": 68176080,
    "learntime": 0.19708593492396176,
    "sampletime": 18.883775003952906,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 190,
    "reward_mean": -16.564922892252635,
    "reward_max": -7.09836647727273,
    "reward_min": -22.38044034090916,
    "reward_std": 3.2111586911213084,
    "timesteps": 68536800,
    "learntime": 0.18478570692241192,
    "sampletime": 18.784991333959624,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 191,
    "reward_mean": -13.50668525464609,
    "reward_max": -6.271136363636342,
    "reward_min": -21.062343750000036,
    "reward_std": 3.6426441654837767,
    "timesteps": 68897520,
    "learntime": 0.18161888304166496,
    "sampletime": 18.62831947207451,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 192,
    "reward_mean": -15.025717773437522,
    "reward_max": -8.690989583333314,
    "reward_min": -21.05401041666674,
    "reward_std": 3.117645404957441,
    "timesteps": 69258240,
    "learntime": 0.19176290510222316,
    "sampletime": 19.044650776078925,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 193,
    "reward_mean": -14.682266660748123,
    "reward_max": -6.740807291666634,
    "reward_min": -25.229687500000082,
    "reward_std": 3.6831313099144745,
    "timesteps": 69618960,
    "learntime": 0.19483325793407857,
    "sampletime": 18.82094537001103,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 194,
    "reward_mean": -13.508794555664075,
    "reward_max": -6.296576704545452,
    "reward_min": -21.76291193181824,
    "reward_std": 3.646373496696929,
    "timesteps": 69979680,
    "learntime": 0.18322797189466655,
    "sampletime": 18.88682628888637,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 195,
    "reward_mean": -11.939361276337586,
    "reward_max": -4.216605113636365,
    "reward_min": -18.906008522727284,
    "reward_std": 3.5790055653225123,
    "timesteps": 70340400,
    "learntime": 0.18057807604782283,
    "sampletime": 18.7166362979915,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 196,
    "reward_mean": -13.514043172200532,
    "reward_max": -6.167059659090879,
    "reward_min": -21.767698863636387,
    "reward_std": 3.537581020780602,
    "timesteps": 70701120,
    "learntime": 0.1944711070973426,
    "sampletime": 18.904633661033586,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 197,
    "reward_mean": -11.541859019886378,
    "reward_max": -2.3557954545454445,
    "reward_min": -19.48608072916674,
    "reward_std": 3.3208873065530127,
    "timesteps": 71061840,
    "learntime": 0.18058092799037695,
    "sampletime": 18.611250026151538,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 198,
    "reward_mean": -8.97888052275686,
    "reward_max": 1.9920596590909128,
    "reward_min": -20.24832386363641,
    "reward_std": 4.040697483887802,
    "timesteps": 71422560,
    "learntime": 0.18819091096520424,
    "sampletime": 18.785753811942413,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 199,
    "reward_mean": -7.242151322798288,
    "reward_max": -1.4898863636363542,
    "reward_min": -15.469062499999994,
    "reward_std": 3.284000839187453,
    "timesteps": 71783280,
    "learntime": 0.17363537102937698,
    "sampletime": 18.637289142934605,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 200,
    "reward_mean": -12.09023080536815,
    "reward_max": -6.029446022727257,
    "reward_min": -19.15893465909099,
    "reward_std": 2.92070139046456,
    "timesteps": 72144000,
    "learntime": 0.17150438693352044,
    "sampletime": 19.806347663979977,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 201,
    "reward_mean": -12.437928300337367,
    "reward_max": -3.998934659090911,
    "reward_min": -18.860596590909157,
    "reward_std": 3.346861019978653,
    "timesteps": 72504720,
    "learntime": 0.16293191304430366,
    "sampletime": 20.882052503991872,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 202,
    "reward_mean": -17.529570294004543,
    "reward_max": -8.833338068181789,
    "reward_min": -27.743991477272825,
    "reward_std": 4.191973743413692,
    "timesteps": 72865440,
    "learntime": 0.18304755096323788,
    "sampletime": 19.074965396896005,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 203,
    "reward_mean": -12.07220618045692,
    "reward_max": -4.847684659090917,
    "reward_min": -21.196335227272776,
    "reward_std": 3.166047194259458,
    "timesteps": 73226160,
    "learntime": 0.30179193895310163,
    "sampletime": 18.89852914190851,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 204,
    "reward_mean": -13.462886315548086,
    "reward_max": -0.2947869318181679,
    "reward_min": -22.750429687500063,
    "reward_std": 4.227721663370144,
    "timesteps": 73586880,
    "learntime": 0.1881695599295199,
    "sampletime": 18.833459376124665,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 205,
    "reward_mean": -10.353144660718513,
    "reward_max": -2.9270738636363647,
    "reward_min": -18.507840909090945,
    "reward_std": 3.7845917453600664,
    "timesteps": 73947600,
    "learntime": 0.17765606194734573,
    "sampletime": 18.69187250593677,
    "best_max_mean": -11.576484356504505,
    "best_max": 2.6413068181818162
  },
  {
    "gen": 206,
    "reward_mean": -5.77556019176135,
    "reward_max": 7.604758522727284,
    "reward_min": -17.11910511363638,
    "reward_std": 4.541318171939748,
    "timesteps": 74308320,
    "learntime": 0.19115284201689065,
    "sampletime": 18.6502054000739,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 207,
    "reward_mean": -12.71541574189158,
    "reward_max": -4.705639204545431,
    "reward_min": -19.047613636363664,
    "reward_std": 3.4273986441108746,
    "timesteps": 74669040,
    "learntime": 0.19918866595253348,
    "sampletime": 18.659350421046838,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 208,
    "reward_mean": -10.937210822827913,
    "reward_max": 2.8916796874999666,
    "reward_min": -19.286051136363714,
    "reward_std": 3.9654844192523107,
    "timesteps": 75029760,
    "learntime": 0.1891027798410505,
    "sampletime": 18.776291124057025,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 209,
    "reward_mean": -11.7922832142223,
    "reward_max": -5.08349431818181,
    "reward_min": -18.722486979166725,
    "reward_std": 2.8619462656367305,
    "timesteps": 75390480,
    "learntime": 0.19403184088878334,
    "sampletime": 18.762048826087266,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 210,
    "reward_mean": -11.621944154681596,
    "reward_max": -3.8888068181818003,
    "reward_min": -18.120156250000015,
    "reward_std": 3.20266820845847,
    "timesteps": 75751200,
    "learntime": 0.19337382982484996,
    "sampletime": 18.676754043903202,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 211,
    "reward_mean": -12.948783994732496,
    "reward_max": -4.947955729166647,
    "reward_min": -21.34907552083341,
    "reward_std": 3.7482213424770854,
    "timesteps": 76111920,
    "learntime": 0.1987752381246537,
    "sampletime": 18.542884564958513,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 212,
    "reward_mean": -10.913120709043579,
    "reward_max": -1.5681107954545908,
    "reward_min": -19.96336647727278,
    "reward_std": 3.9898734971408127,
    "timesteps": 76472640,
    "learntime": 0.19564135582186282,
    "sampletime": 18.725735421990976,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 213,
    "reward_mean": -15.47174826882106,
    "reward_max": -7.991946022727257,
    "reward_min": -24.46007102272738,
    "reward_std": 4.064971102894119,
    "timesteps": 76833360,
    "learntime": 0.18900331389158964,
    "sampletime": 18.79751018388197,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 214,
    "reward_mean": -16.892089640299517,
    "reward_max": -9.010572916666666,
    "reward_min": -26.861510416666842,
    "reward_std": 3.862143347113509,
    "timesteps": 77194080,
    "learntime": 0.1857526721432805,
    "sampletime": 18.88529093703255,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 215,
    "reward_mean": -13.301713404799969,
    "reward_max": -5.130482954545437,
    "reward_min": -25.322102272727385,
    "reward_std": 3.5284775574777894,
    "timesteps": 77554800,
    "learntime": 0.1974762638565153,
    "sampletime": 18.64627311285585,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 216,
    "reward_mean": -11.540199843897973,
    "reward_max": -1.9210416666666406,
    "reward_min": -17.738508522727354,
    "reward_std": 3.327594314462569,
    "timesteps": 77915520,
    "learntime": 0.1936527860816568,
    "sampletime": 18.693836004007608,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 217,
    "reward_mean": -8.8171064157197,
    "reward_max": -1.9620596590908965,
    "reward_min": -18.267200520833388,
    "reward_std": 3.41585991572797,
    "timesteps": 78276240,
    "learntime": 0.18261702195741236,
    "sampletime": 18.694535380927846,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 218,
    "reward_mean": -11.055558138760656,
    "reward_max": 0.0009090909091189884,
    "reward_min": -20.211221590909144,
    "reward_std": 4.01228498938318,
    "timesteps": 78636960,
    "learntime": 0.18676171987317502,
    "sampletime": 18.717243151040748,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 219,
    "reward_mean": -9.416485170306583,
    "reward_max": -1.6036848958333205,
    "reward_min": -15.49940340909093,
    "reward_std": 3.3084374287546345,
    "timesteps": 78997680,
    "learntime": 0.19947532191872597,
    "sampletime": 18.7851663751062,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 220,
    "reward_mean": -9.642568581321004,
    "reward_max": -4.353494318181777,
    "reward_min": -15.01242897727275,
    "reward_std": 2.7947028808569816,
    "timesteps": 79358400,
    "learntime": 0.20052637811750174,
    "sampletime": 18.57225116994232,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 221,
    "reward_mean": -11.295698334665005,
    "reward_max": -3.689886363636356,
    "reward_min": -17.38400568181825,
    "reward_std": 2.821892185394531,
    "timesteps": 79719120,
    "learntime": 0.20330643188208342,
    "sampletime": 18.57260467321612,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 222,
    "reward_mean": -11.414135908647017,
    "reward_max": -4.511458333333306,
    "reward_min": -17.442825520833377,
    "reward_std": 2.7066765830392883,
    "timesteps": 80079840,
    "learntime": 0.18318941094912589,
    "sampletime": 18.605431685922667,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 223,
    "reward_mean": -12.2797617964311,
    "reward_max": -6.763153409090919,
    "reward_min": -18.85756510416673,
    "reward_std": 2.5069042388611584,
    "timesteps": 80440560,
    "learntime": 0.18412510002963245,
    "sampletime": 18.802951857913285,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 224,
    "reward_mean": -14.428709679805877,
    "reward_max": -5.285596590909076,
    "reward_min": -19.867741477272734,
    "reward_std": 2.8987718600601884,
    "timesteps": 80801280,
    "learntime": 0.1933724321424961,
    "sampletime": 18.824929245049134,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 225,
    "reward_mean": -10.595234338008998,
    "reward_max": -1.7203835227272668,
    "reward_min": -20.169602272727328,
    "reward_std": 3.778848784645276,
    "timesteps": 81162000,
    "learntime": 0.18832160695455968,
    "sampletime": 20.18052912899293,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 226,
    "reward_mean": -8.424640946821713,
    "reward_max": -1.2458948863635835,
    "reward_min": -15.585454545454551,
    "reward_std": 3.0500206112734713,
    "timesteps": 81522720,
    "learntime": 0.2825910041574389,
    "sampletime": 18.522799763130024,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 227,
    "reward_mean": -10.781589466441769,
    "reward_max": -3.4864488636363826,
    "reward_min": -18.01552556818192,
    "reward_std": 3.6572839706849325,
    "timesteps": 81883440,
    "learntime": 0.1873428130056709,
    "sampletime": 18.867818463826552,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 228,
    "reward_mean": -10.963934215198865,
    "reward_max": -3.254744318181808,
    "reward_min": -20.119417613636426,
    "reward_std": 3.3696414292701893,
    "timesteps": 82244160,
    "learntime": 0.2017950308509171,
    "sampletime": 18.646195844979957,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 229,
    "reward_mean": -13.945084561434662,
    "reward_max": -7.301732954545451,
    "reward_min": -21.240724431818226,
    "reward_std": 2.8812018576046117,
    "timesteps": 82604880,
    "learntime": 0.3030970790423453,
    "sampletime": 18.765568566974252,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 230,
    "reward_mean": -10.938597911487916,
    "reward_max": -5.179914772727262,
    "reward_min": -16.96025568181818,
    "reward_std": 2.8856871762878202,
    "timesteps": 82965600,
    "learntime": 0.18768182606436312,
    "sampletime": 18.72216066112742,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 231,
    "reward_mean": -9.565680800929204,
    "reward_max": -2.8892897727272393,
    "reward_min": -14.833153409090892,
    "reward_std": 2.939722457724428,
    "timesteps": 83326320,
    "learntime": 0.2927571239415556,
    "sampletime": 20.298664287198335,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 232,
    "reward_mean": -12.819089096531721,
    "reward_max": -6.440454545454534,
    "reward_min": -18.95816406250002,
    "reward_std": 3.2066837191434994,
    "timesteps": 83687040,
    "learntime": 0.19722660700790584,
    "sampletime": 20.621771628968418,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 233,
    "reward_mean": -15.027905439897047,
    "reward_max": -6.815703125000007,
    "reward_min": -21.900639204545495,
    "reward_std": 3.324235828784244,
    "timesteps": 84047760,
    "learntime": 0.2891155700199306,
    "sampletime": 18.80998092191294,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 234,
    "reward_mean": -10.697640380859376,
    "reward_max": -2.111605113636355,
    "reward_min": -18.28731534090913,
    "reward_std": 3.4953985893158483,
    "timesteps": 84408480,
    "learntime": 0.17360427090898156,
    "sampletime": 18.701275675790384,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 235,
    "reward_mean": -7.818338512073851,
    "reward_max": 2.2164630681818567,
    "reward_min": -14.115227272727248,
    "reward_std": 3.5168677767695034,
    "timesteps": 84769200,
    "learntime": 0.2891059648245573,
    "sampletime": 18.75165972393006,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 236,
    "reward_mean": -7.567740755948139,
    "reward_max": 3.2665234375000245,
    "reward_min": -15.699815340909117,
    "reward_std": 3.9087926521433074,
    "timesteps": 85129920,
    "learntime": 0.19418738689273596,
    "sampletime": 18.68821909208782,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 237,
    "reward_mean": -12.697534420129044,
    "reward_max": -3.857201704545426,
    "reward_min": -21.20058593750007,
    "reward_std": 3.7849930108028262,
    "timesteps": 85490640,
    "learntime": 0.30381432897411287,
    "sampletime": 18.716534197097644,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 238,
    "reward_mean": -11.905405920780062,
    "reward_max": -6.042230113636319,
    "reward_min": -20.060326704545545,
    "reward_std": 2.7551545369105788,
    "timesteps": 85851360,
    "learntime": 0.2023289219941944,
    "sampletime": 18.671666611917317,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 239,
    "reward_mean": -9.489231086499755,
    "reward_max": -3.828450520833325,
    "reward_min": -19.136184895833356,
    "reward_std": 3.3893264840549064,
    "timesteps": 86212080,
    "learntime": 0.3077551748137921,
    "sampletime": 19.30308868107386,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 240,
    "reward_mean": -8.468857366388502,
    "reward_max": -1.2648295454545362,
    "reward_min": -19.73751420454556,
    "reward_std": 3.203364083085819,
    "timesteps": 86572800,
    "learntime": 0.18828799086622894,
    "sampletime": 18.86658884002827,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 241,
    "reward_mean": -15.573147527521352,
    "reward_max": -6.812741477272765,
    "reward_min": -23.73763020833344,
    "reward_std": 3.6402626191624536,
    "timesteps": 86933520,
    "learntime": 0.3044722031336278,
    "sampletime": 18.78144627297297,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 242,
    "reward_mean": -15.182952510949356,
    "reward_max": -9.02954545454545,
    "reward_min": -21.67817708333341,
    "reward_std": 2.920011767812331,
    "timesteps": 87294240,
    "learntime": 0.184349404880777,
    "sampletime": 18.95470303297043,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 243,
    "reward_mean": -12.565482584635408,
    "reward_max": -7.0064583333333035,
    "reward_min": -18.656321022727276,
    "reward_std": 2.6187868451203253,
    "timesteps": 87654960,
    "learntime": 0.299699051072821,
    "sampletime": 18.583929480053484,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 244,
    "reward_mean": -9.797694387724903,
    "reward_max": -3.283039772727292,
    "reward_min": -17.27161931818188,
    "reward_std": 3.2563258800735824,
    "timesteps": 88015680,
    "learntime": 0.19910005386918783,
    "sampletime": 18.863818732788786,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 245,
    "reward_mean": -10.628969560102975,
    "reward_max": -3.3166406249999927,
    "reward_min": -17.084034090909103,
    "reward_std": 2.9952807361684046,
    "timesteps": 88376400,
    "learntime": 0.29772466514259577,
    "sampletime": 19.354619208956137,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 246,
    "reward_mean": -10.223212095318404,
    "reward_max": -3.546661931818154,
    "reward_min": -17.26450284090912,
    "reward_std": 2.9996672653450367,
    "timesteps": 88737120,
    "learntime": 0.19856279878877103,
    "sampletime": 18.790687423199415,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 247,
    "reward_mean": -5.457218905362224,
    "reward_max": 2.9267755681817844,
    "reward_min": -14.571419270833365,
    "reward_std": 3.4423301900282413,
    "timesteps": 89097840,
    "learntime": 0.30803346494212747,
    "sampletime": 18.614324033958837,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 248,
    "reward_mean": -8.126434529622392,
    "reward_max": -1.2909374999999874,
    "reward_min": -16.669730113636398,
    "reward_std": 3.0384915261483356,
    "timesteps": 89458560,
    "learntime": 0.18549115513451397,
    "sampletime": 18.53890596795827,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 249,
    "reward_mean": -9.778938358191267,
    "reward_max": -3.4226420454545288,
    "reward_min": -14.577329545454546,
    "reward_std": 2.5399020665111594,
    "timesteps": 89819280,
    "learntime": 0.2952120928093791,
    "sampletime": 18.63259562989697,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 250,
    "reward_mean": -8.358430305249748,
    "reward_max": -2.4778835227272538,
    "reward_min": -13.761979166666668,
    "reward_std": 2.7815168898265994,
    "timesteps": 90180000,
    "learntime": 0.19563004304654896,
    "sampletime": 18.67799415718764,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 251,
    "reward_mean": -12.076254993785522,
    "reward_max": 3.331477272727258,
    "reward_min": -19.93000000000002,
    "reward_std": 3.770241831719347,
    "timesteps": 90540720,
    "learntime": 0.3216350208967924,
    "sampletime": 18.86930450401269,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 252,
    "reward_mean": -9.24162558815696,
    "reward_max": -1.2315767045454409,
    "reward_min": -20.030468750000068,
    "reward_std": 4.122517873606646,
    "timesteps": 90901440,
    "learntime": 0.19226597412489355,
    "sampletime": 18.7132077740971,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 253,
    "reward_mean": -11.550337376450047,
    "reward_max": -6.1610416666666445,
    "reward_min": -21.575198863636455,
    "reward_std": 3.056354010039126,
    "timesteps": 91262160,
    "learntime": 0.31474367692135274,
    "sampletime": 18.879431118955836,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 254,
    "reward_mean": -10.792104140772974,
    "reward_max": -1.7481250000000133,
    "reward_min": -19.42933238636366,
    "reward_std": 3.4749260056602833,
    "timesteps": 91622880,
    "learntime": 0.19054301991127431,
    "sampletime": 18.88560742000118,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 255,
    "reward_mean": -8.477809725674714,
    "reward_max": 1.8552864583333608,
    "reward_min": -14.855681818181825,
    "reward_std": 3.620616265106016,
    "timesteps": 91983600,
    "learntime": 0.2916551090311259,
    "sampletime": 18.61198026780039,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 256,
    "reward_mean": -10.727794633345155,
    "reward_max": -2.835142045454539,
    "reward_min": -18.142613636363638,
    "reward_std": 2.9857269345435857,
    "timesteps": 92344320,
    "learntime": 0.1940569430589676,
    "sampletime": 18.63044006587006,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 257,
    "reward_mean": -10.804668597597074,
    "reward_max": -2.7287784090908946,
    "reward_min": -18.532414772727318,
    "reward_std": 3.665343967493343,
    "timesteps": 92705040,
    "learntime": 0.3173446769360453,
    "sampletime": 18.84638619585894,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 258,
    "reward_mean": -8.42473484848485,
    "reward_max": -2.0092897727272523,
    "reward_min": -15.901036931818231,
    "reward_std": 3.2189373486341144,
    "timesteps": 93065760,
    "learntime": 0.20326069393195212,
    "sampletime": 18.53973241406493,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 259,
    "reward_mean": -11.626352465080492,
    "reward_max": -6.364133522727272,
    "reward_min": -17.949921875000037,
    "reward_std": 2.990642240509112,
    "timesteps": 93426480,
    "learntime": 0.2928634418640286,
    "sampletime": 18.833912032889202,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 260,
    "reward_mean": -11.706865863222065,
    "reward_max": -3.0081380208333113,
    "reward_min": -23.403338068181895,
    "reward_std": 4.100604184975349,
    "timesteps": 93787200,
    "learntime": 0.20345392799936235,
    "sampletime": 18.62636083899997,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 261,
    "reward_mean": -6.097182321259451,
    "reward_max": 1.0490494791667062,
    "reward_min": -12.657215909090873,
    "reward_std": 3.1910680702225735,
    "timesteps": 94147920,
    "learntime": 0.27938184002414346,
    "sampletime": 18.545349988155067,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 262,
    "reward_mean": -9.152881136807531,
    "reward_max": 0.39532670454545527,
    "reward_min": -18.629247159090916,
    "reward_std": 4.105678184928451,
    "timesteps": 94508640,
    "learntime": 0.19608426606282592,
    "sampletime": 18.55078084510751,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 263,
    "reward_mean": -9.605836181640601,
    "reward_max": -5.451676136363619,
    "reward_min": -16.107291666666686,
    "reward_std": 2.3277536536828944,
    "timesteps": 94869360,
    "learntime": 0.29500439879484475,
    "sampletime": 20.188822569092736,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 264,
    "reward_mean": -14.832956006599193,
    "reward_max": -7.615340909090881,
    "reward_min": -20.14390625000003,
    "reward_std": 2.389593666245841,
    "timesteps": 95230080,
    "learntime": 0.18339999904856086,
    "sampletime": 18.759511848911643,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 265,
    "reward_mean": -8.608691387754476,
    "reward_max": -0.6161079545454134,
    "reward_min": -15.37771306818184,
    "reward_std": 2.852221496162979,
    "timesteps": 95590800,
    "learntime": 0.30601693713106215,
    "sampletime": 18.81214605504647,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 266,
    "reward_mean": -10.244917343602038,
    "reward_max": 1.624232954545473,
    "reward_min": -17.80281250000001,
    "reward_std": 3.7735032804975943,
    "timesteps": 95951520,
    "learntime": 0.20529303699731827,
    "sampletime": 18.73263764497824,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 267,
    "reward_mean": -11.238888605291184,
    "reward_max": -5.119661458333333,
    "reward_min": -18.00181818181818,
    "reward_std": 3.0679194956692255,
    "timesteps": 96312240,
    "learntime": 0.2900733279529959,
    "sampletime": 18.58212460298091,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 268,
    "reward_mean": -10.051109082771085,
    "reward_max": -2.509474431818241,
    "reward_min": -19.46850852272734,
    "reward_std": 3.3001128789623517,
    "timesteps": 96672960,
    "learntime": 0.19555750908330083,
    "sampletime": 18.778110028943047,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 269,
    "reward_mean": -9.631306355794262,
    "reward_max": -1.0686221590908713,
    "reward_min": -17.748932291666723,
    "reward_std": 3.6929171894355033,
    "timesteps": 97033680,
    "learntime": 0.3144660310354084,
    "sampletime": 18.75632688216865,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 270,
    "reward_mean": -11.41310491388494,
    "reward_max": -5.773210227272687,
    "reward_min": -18.928636363636397,
    "reward_std": 3.4394557987536896,
    "timesteps": 97394400,
    "learntime": 0.2008656591642648,
    "sampletime": 18.763908718014136,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 271,
    "reward_mean": -8.997908066258287,
    "reward_max": -3.5804687499999774,
    "reward_min": -14.327840909090908,
    "reward_std": 2.824451897719705,
    "timesteps": 97755120,
    "learntime": 0.309465458849445,
    "sampletime": 18.62981840199791,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 272,
    "reward_mean": -9.314716593424485,
    "reward_max": 2.489758522727256,
    "reward_min": -15.980127840909098,
    "reward_std": 3.7859524264578415,
    "timesteps": 98115840,
    "learntime": 0.19989932398311794,
    "sampletime": 18.578172417124733,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 273,
    "reward_mean": -8.04256149754379,
    "reward_max": -2.532642045454521,
    "reward_min": -15.710625000000027,
    "reward_std": 2.7786155641603725,
    "timesteps": 98476560,
    "learntime": 0.29889035387896,
    "sampletime": 18.488019361160696,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 274,
    "reward_mean": -10.408013842033618,
    "reward_max": -3.922883522727263,
    "reward_min": -16.541491477272764,
    "reward_std": 2.9924829869127594,
    "timesteps": 98837280,
    "learntime": 0.18661872996017337,
    "sampletime": 18.724013328086585,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 275,
    "reward_mean": -5.657662372011108,
    "reward_max": 0.18781250000001426,
    "reward_min": -11.324630681818181,
    "reward_std": 2.6713954422139796,
    "timesteps": 99198000,
    "learntime": 0.3052952568978071,
    "sampletime": 18.692404102999717,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 276,
    "reward_mean": -8.206041962594682,
    "reward_max": 4.8895880681818165,
    "reward_min": -14.305227272727272,
    "reward_std": 3.803500354998066,
    "timesteps": 99558720,
    "learntime": 0.1925447778776288,
    "sampletime": 18.8759174880106,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 277,
    "reward_mean": -12.509898755622638,
    "reward_max": -2.3177840909090794,
    "reward_min": -19.954644886363678,
    "reward_std": 3.4591106876429407,
    "timesteps": 99919440,
    "learntime": 0.29698569397442043,
    "sampletime": 18.782571187010035,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 278,
    "reward_mean": -11.492410685221364,
    "reward_max": -2.728423295454522,
    "reward_min": -19.30095170454553,
    "reward_std": 3.2832452552414226,
    "timesteps": 100280160,
    "learntime": 0.19956001709215343,
    "sampletime": 18.583377628820017,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 279,
    "reward_mean": -11.285304306492655,
    "reward_max": -3.6499573863636106,
    "reward_min": -18.301661931818234,
    "reward_std": 3.3779975733623746,
    "timesteps": 100640880,
    "learntime": 0.3196700511034578,
    "sampletime": 18.631134414114058,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 280,
    "reward_mean": -6.064095588452878,
    "reward_max": 1.7586079545454558,
    "reward_min": -16.079895833333364,
    "reward_std": 3.8690697696248315,
    "timesteps": 101001600,
    "learntime": 0.18782190000638366,
    "sampletime": 18.69806340499781,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 281,
    "reward_mean": -4.692382091175421,
    "reward_max": 4.1570596590908915,
    "reward_min": -12.088892045454543,
    "reward_std": 3.3626894844854545,
    "timesteps": 101362320,
    "learntime": 0.297785755014047,
    "sampletime": 18.531871971907094,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 282,
    "reward_mean": -10.95942297733192,
    "reward_max": -2.622851562500003,
    "reward_min": -18.705383522727324,
    "reward_std": 3.2153945363906264,
    "timesteps": 101723040,
    "learntime": 0.18961181212216616,
    "sampletime": 18.80089041707106,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 283,
    "reward_mean": -11.12161959561434,
    "reward_max": -4.107613636363597,
    "reward_min": -19.423451704545506,
    "reward_std": 3.3682409535033075,
    "timesteps": 102083760,
    "learntime": 0.2979736460838467,
    "sampletime": 18.485348948044702,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 284,
    "reward_mean": -14.134728060635672,
    "reward_max": -7.237272727272702,
    "reward_min": -20.229659090909134,
    "reward_std": 3.1155698618627,
    "timesteps": 102444480,
    "learntime": 0.20504328794777393,
    "sampletime": 18.996753483079374,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 285,
    "reward_mean": -14.184633585611998,
    "reward_max": -5.2409090909091045,
    "reward_min": -21.61500000000004,
    "reward_std": 3.5611277410191984,
    "timesteps": 102805200,
    "learntime": 0.2740660661365837,
    "sampletime": 18.897776695899665,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 286,
    "reward_mean": -14.20168194395126,
    "reward_max": -6.0650852272727,
    "reward_min": -22.972741477272844,
    "reward_std": 3.1541489367034115,
    "timesteps": 103165920,
    "learntime": 0.19393199612386525,
    "sampletime": 18.942324856994674,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 287,
    "reward_mean": -7.459920894738395,
    "reward_max": 1.673295454545493,
    "reward_min": -14.297982954545484,
    "reward_std": 3.57246488429604,
    "timesteps": 103526640,
    "learntime": 0.3030339351389557,
    "sampletime": 18.575242497958243,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 288,
    "reward_mean": -5.392251956824093,
    "reward_max": 2.549247159090874,
    "reward_min": -12.075127840909074,
    "reward_std": 3.32580611388216,
    "timesteps": 103887360,
    "learntime": 0.18568946910090744,
    "sampletime": 18.6106734580826,
    "best_max_mean": -5.77556019176135,
    "best_max": 7.604758522727284
  },
  {
    "gen": 289,
    "reward_mean": -2.326923791133998,
    "reward_max": 8.34898437499997,
    "reward_min": -11.033238636363599,
    "reward_std": 3.398694413353241,
    "timesteps": 104248080,
    "learntime": 0.32064826088026166,
    "sampletime": 18.381039650179446,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 290,
    "reward_mean": -7.1680953147194755,
    "reward_max": 5.095340909090878,
    "reward_min": -15.188749999999994,
    "reward_std": 4.234132489375349,
    "timesteps": 104608800,
    "learntime": 0.18207855289801955,
    "sampletime": 18.846340321935713,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 291,
    "reward_mean": -11.147770145300665,
    "reward_max": -3.727414772727296,
    "reward_min": -18.685651041666684,
    "reward_std": 2.9589162998852445,
    "timesteps": 104969520,
    "learntime": 0.3018757540266961,
    "sampletime": 18.592789884191006,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 292,
    "reward_mean": -13.910851699366717,
    "reward_max": -6.797883522727269,
    "reward_min": -21.86910156250006,
    "reward_std": 3.097890951869755,
    "timesteps": 105330240,
    "learntime": 0.20028394903056324,
    "sampletime": 18.753978764871135,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 293,
    "reward_mean": -13.593302741773213,
    "reward_max": -7.895965909090873,
    "reward_min": -19.42174715909093,
    "reward_std": 2.6629039507069496,
    "timesteps": 105690960,
    "learntime": 0.3052229732275009,
    "sampletime": 18.65351214306429,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 294,
    "reward_mean": -14.493558738014917,
    "reward_max": -9.268352272727244,
    "reward_min": -19.40039062500007,
    "reward_std": 2.2007515853509485,
    "timesteps": 106051680,
    "learntime": 0.18055250798352063,
    "sampletime": 21.377803110983223,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 295,
    "reward_mean": -13.005185861298536,
    "reward_max": -6.294573863636338,
    "reward_min": -19.554517045454585,
    "reward_std": 2.8342046975159927,
    "timesteps": 106412400,
    "learntime": 0.28458746685646474,
    "sampletime": 19.337142293108627,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 296,
    "reward_mean": -8.751488314541925,
    "reward_max": 0.49967447916660923,
    "reward_min": -21.94255681818189,
    "reward_std": 4.343258091439471,
    "timesteps": 106773120,
    "learntime": 0.18815316702239215,
    "sampletime": 18.520974489860237,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 297,
    "reward_mean": -8.394503895152697,
    "reward_max": 0.31039772727277465,
    "reward_min": -15.858835227272793,
    "reward_std": 3.371183992037847,
    "timesteps": 107133840,
    "learntime": 0.32941274903714657,
    "sampletime": 18.697176621994004,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 298,
    "reward_mean": -10.60363530939276,
    "reward_max": -2.8917329545454313,
    "reward_min": -17.00937500000005,
    "reward_std": 3.331160969486167,
    "timesteps": 107494560,
    "learntime": 0.19178432784974575,
    "sampletime": 18.792425032006577,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 299,
    "reward_mean": -12.909900938091862,
    "reward_max": -7.1825852272727415,
    "reward_min": -22.7120963541667,
    "reward_std": 3.6280169589461235,
    "timesteps": 107855280,
    "learntime": 0.29798238701187074,
    "sampletime": 18.719224507920444,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 300,
    "reward_mean": -9.788695974638959,
    "reward_max": -0.9045170454545509,
    "reward_min": -16.093551136363647,
    "reward_std": 3.242626060543503,
    "timesteps": 108216000,
    "learntime": 0.20342070003971457,
    "sampletime": 18.704649758990854,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 301,
    "reward_mean": -10.840940440784799,
    "reward_max": -2.933309659090899,
    "reward_min": -17.271931818181855,
    "reward_std": 3.2572710830494866,
    "timesteps": 108576720,
    "learntime": 0.15940530598163605,
    "sampletime": 20.261953162029386,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 302,
    "reward_mean": -11.987491381096127,
    "reward_max": -4.564616477272751,
    "reward_min": -20.706832386363725,
    "reward_std": 3.1298859575993903,
    "timesteps": 108937440,
    "learntime": 0.19756511691957712,
    "sampletime": 19.03852581884712,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 303,
    "reward_mean": -13.086013978900345,
    "reward_max": -4.846875000000022,
    "reward_min": -20.73880208333343,
    "reward_std": 3.370988631735385,
    "timesteps": 109298160,
    "learntime": 0.29967118706554174,
    "sampletime": 19.03479428915307,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 304,
    "reward_mean": -9.519730058149843,
    "reward_max": -4.175156249999959,
    "reward_min": -17.317855113636362,
    "reward_std": 3.0493249221288163,
    "timesteps": 109658880,
    "learntime": 0.19879818218760192,
    "sampletime": 18.66871139407158,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 305,
    "reward_mean": -9.690379620176365,
    "reward_max": -2.221590909090953,
    "reward_min": -16.457727272727254,
    "reward_std": 2.7921452161381572,
    "timesteps": 110019600,
    "learntime": 0.19732245500199497,
    "sampletime": 18.66151538095437,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 306,
    "reward_mean": -10.956712221087823,
    "reward_max": -4.159609374999967,
    "reward_min": -17.98481534090914,
    "reward_std": 3.0135835553026156,
    "timesteps": 110380320,
    "learntime": 0.3093921320978552,
    "sampletime": 18.828576470026746,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 307,
    "reward_mean": -10.337074936375476,
    "reward_max": -2.491093749999988,
    "reward_min": -17.485738636363656,
    "reward_std": 2.875060395024882,
    "timesteps": 110741040,
    "learntime": 0.19357381202280521,
    "sampletime": 21.154992314055562,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 308,
    "reward_mean": -7.865072280421404,
    "reward_max": -0.6096223958334012,
    "reward_min": -18.32748697916669,
    "reward_std": 3.4262560362712606,
    "timesteps": 111101760,
    "learntime": 0.19613094814121723,
    "sampletime": 18.814308570930734,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 309,
    "reward_mean": -9.347943318684887,
    "reward_max": -1.7547159090908715,
    "reward_min": -16.37323863636366,
    "reward_std": 3.3577392847167427,
    "timesteps": 111462480,
    "learntime": 0.188601931091398,
    "sampletime": 18.666122142923996,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 310,
    "reward_mean": -11.39529446688567,
    "reward_max": -2.396633522727267,
    "reward_min": -18.029105113636415,
    "reward_std": 3.260474403902438,
    "timesteps": 111823200,
    "learntime": 0.19422941794618964,
    "sampletime": 18.546978167956695,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 311,
    "reward_mean": -8.842063080758745,
    "reward_max": -2.347838541666655,
    "reward_min": -15.730568181818153,
    "reward_std": 2.7659881324423483,
    "timesteps": 112183920,
    "learntime": 0.18245683889836073,
    "sampletime": 18.586928648874164,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 312,
    "reward_mean": -12.012950199011602,
    "reward_max": -2.667304687499953,
    "reward_min": -19.125880681818202,
    "reward_std": 3.404957128729568,
    "timesteps": 112544640,
    "learntime": 0.19036896107718349,
    "sampletime": 18.63185903383419,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 313,
    "reward_mean": -12.345427819454303,
    "reward_max": -4.795042613636347,
    "reward_min": -20.11842329545458,
    "reward_std": 3.2517926191667774,
    "timesteps": 112905360,
    "learntime": 0.20486526796594262,
    "sampletime": 18.855052076047286,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 314,
    "reward_mean": -10.676903797496436,
    "reward_max": -1.9747301136363313,
    "reward_min": -18.681718750000023,
    "reward_std": 3.2777667487141744,
    "timesteps": 113266080,
    "learntime": 0.18562416196800768,
    "sampletime": 18.55466000107117,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 315,
    "reward_mean": -11.428556074662637,
    "reward_max": -1.6389488636363545,
    "reward_min": -17.322760416666657,
    "reward_std": 2.971022605587288,
    "timesteps": 113626800,
    "learntime": 0.1817084620706737,
    "sampletime": 18.60919313901104,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 316,
    "reward_mean": -10.311137658321494,
    "reward_max": -4.575742187499982,
    "reward_min": -19.224460227272807,
    "reward_std": 3.3695731882225037,
    "timesteps": 113987520,
    "learntime": 0.18675705115310848,
    "sampletime": 18.550717171048746,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 317,
    "reward_mean": -12.18887639825995,
    "reward_max": -5.2473567708333215,
    "reward_min": -22.33032670454548,
    "reward_std": 3.1702270499140814,
    "timesteps": 114348240,
    "learntime": 0.19267862918786705,
    "sampletime": 18.649850921006873,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 318,
    "reward_mean": -8.579638856830023,
    "reward_max": 1.2300852272727363,
    "reward_min": -15.89938920454544,
    "reward_std": 3.8267959138333283,
    "timesteps": 114708960,
    "learntime": 0.20498556783422828,
    "sampletime": 18.728479413082823,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 319,
    "reward_mean": -6.880200047348488,
    "reward_max": -0.39370738636360336,
    "reward_min": -14.564715909090967,
    "reward_std": 3.5340818464523225,
    "timesteps": 115069680,
    "learntime": 0.18202265491709113,
    "sampletime": 20.880367015022784,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 320,
    "reward_mean": -11.659038696289077,
    "reward_max": -1.4837500000000157,
    "reward_min": -17.916718750000054,
    "reward_std": 3.13722488170315,
    "timesteps": 115430400,
    "learntime": 0.2020278531126678,
    "sampletime": 18.96538061602041,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 321,
    "reward_mean": -10.192356696851318,
    "reward_max": -2.7403977272727507,
    "reward_min": -19.26917613636369,
    "reward_std": 2.898443901141102,
    "timesteps": 115791120,
    "learntime": 0.1907391829881817,
    "sampletime": 18.482027648948133,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 322,
    "reward_mean": -7.025494884144164,
    "reward_max": 0.6379403409090952,
    "reward_min": -15.15274147727274,
    "reward_std": 3.8125632392600606,
    "timesteps": 116151840,
    "learntime": 0.20517285587266088,
    "sampletime": 18.73504900187254,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 323,
    "reward_mean": -8.893146750710237,
    "reward_max": 0.9113151041666866,
    "reward_min": -19.70943181818184,
    "reward_std": 3.578600172737135,
    "timesteps": 116512560,
    "learntime": 0.189587261993438,
    "sampletime": 18.4962406931445,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 324,
    "reward_mean": -6.410800596294975,
    "reward_max": 0.16178977272727305,
    "reward_min": -13.059474431818165,
    "reward_std": 3.2475661204277566,
    "timesteps": 116873280,
    "learntime": 0.1984552899375558,
    "sampletime": 18.701747274026275,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 325,
    "reward_mean": -8.458409904711164,
    "reward_max": -0.28596354166667776,
    "reward_min": -16.151576704545473,
    "reward_std": 3.4548941334727274,
    "timesteps": 117234000,
    "learntime": 0.19005925813689828,
    "sampletime": 18.345349160954356,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 326,
    "reward_mean": -9.465593261718748,
    "reward_max": -0.6079119318181359,
    "reward_min": -16.60438802083337,
    "reward_std": 3.759858370372826,
    "timesteps": 117594720,
    "learntime": 0.18841029703617096,
    "sampletime": 18.91651811497286,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 327,
    "reward_mean": -5.559695712002825,
    "reward_max": 1.9714346590909222,
    "reward_min": -12.712258522727266,
    "reward_std": 3.2240083610424586,
    "timesteps": 117955440,
    "learntime": 0.20005499478429556,
    "sampletime": 19.392431674990803,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 328,
    "reward_mean": -7.070990878018447,
    "reward_max": -0.2884090909090453,
    "reward_min": -13.128096590909104,
    "reward_std": 3.1730176094661604,
    "timesteps": 118316160,
    "learntime": 0.19804682210087776,
    "sampletime": 18.49336505588144,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 329,
    "reward_mean": -6.215181755297104,
    "reward_max": 3.2072017045453993,
    "reward_min": -13.735260416666668,
    "reward_std": 3.368986378074015,
    "timesteps": 118676880,
    "learntime": 0.19509719987399876,
    "sampletime": 18.56872944603674,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 330,
    "reward_mean": -8.473036499023422,
    "reward_max": -2.252057291666673,
    "reward_min": -18.037301136363652,
    "reward_std": 3.277817470485451,
    "timesteps": 119037600,
    "learntime": 0.20009781909175217,
    "sampletime": 18.51893013296649,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 331,
    "reward_mean": -9.92059893983783,
    "reward_max": -1.6693181818181757,
    "reward_min": -18.515553977272784,
    "reward_std": 4.0112355947693565,
    "timesteps": 119398320,
    "learntime": 0.20184486196376383,
    "sampletime": 18.635660456959158,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 332,
    "reward_mean": -7.974590472597041,
    "reward_max": -0.039588068181804624,
    "reward_min": -14.79454545454544,
    "reward_std": 2.8358803457035546,
    "timesteps": 119759040,
    "learntime": 0.19930309592746198,
    "sampletime": 18.811720161000267,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 333,
    "reward_mean": -7.9781865345347995,
    "reward_max": 0.5200994318181877,
    "reward_min": -14.791477272727285,
    "reward_std": 3.257824264407965,
    "timesteps": 120119760,
    "learntime": 0.1954509390052408,
    "sampletime": 22.50021474994719,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 334,
    "reward_mean": -11.136839673591382,
    "reward_max": -1.8837215909090894,
    "reward_min": -18.81238281250008,
    "reward_std": 2.9433370752706454,
    "timesteps": 120480480,
    "learntime": 0.20438480097800493,
    "sampletime": 18.49946528719738,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 335,
    "reward_mean": -10.665636134292123,
    "reward_max": -3.5729261363636238,
    "reward_min": -16.520284090909083,
    "reward_std": 2.906180482987066,
    "timesteps": 120841200,
    "learntime": 0.1974433371797204,
    "sampletime": 18.560953931882977,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 336,
    "reward_mean": -11.93034606933593,
    "reward_max": -5.487613636363623,
    "reward_min": -18.262855113636434,
    "reward_std": 2.9183778728381427,
    "timesteps": 121201920,
    "learntime": 0.20041322312317789,
    "sampletime": 18.70532688195817,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 337,
    "reward_mean": -7.41417693167021,
    "reward_max": 4.791164772727251,
    "reward_min": -15.498451704545477,
    "reward_std": 4.363086596612206,
    "timesteps": 121562640,
    "learntime": 0.18514398694969714,
    "sampletime": 18.68776077008806,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 338,
    "reward_mean": -11.114521243933481,
    "reward_max": -2.841783854166677,
    "reward_min": -16.569999999999997,
    "reward_std": 2.861061972378542,
    "timesteps": 121923360,
    "learntime": 0.20169579796493053,
    "sampletime": 18.640975523972884,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 339,
    "reward_mean": -11.156447347005205,
    "reward_max": -5.898984374999963,
    "reward_min": -17.94840909090916,
    "reward_std": 2.772244049784931,
    "timesteps": 122284080,
    "learntime": 0.19978691707365215,
    "sampletime": 18.72569917095825,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 340,
    "reward_mean": -11.4657226747455,
    "reward_max": -3.0134244791666345,
    "reward_min": -19.741328125000084,
    "reward_std": 3.4703138732500465,
    "timesteps": 122644800,
    "learntime": 0.19032897893339396,
    "sampletime": 18.69997140695341,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 341,
    "reward_mean": -9.841123527758047,
    "reward_max": -1.2859801136363778,
    "reward_min": -16.83855468750002,
    "reward_std": 3.364490245380951,
    "timesteps": 123005520,
    "learntime": 0.1888111310545355,
    "sampletime": 18.60561652085744,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 342,
    "reward_mean": -8.10558127663351,
    "reward_max": -0.7277698863635716,
    "reward_min": -14.706860795454542,
    "reward_std": 3.093511225306902,
    "timesteps": 123366240,
    "learntime": 0.1997765761334449,
    "sampletime": 18.391418673098087,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 343,
    "reward_mean": -11.673047485351567,
    "reward_max": -3.9812926136363274,
    "reward_min": -18.818125000000034,
    "reward_std": 3.33649623718383,
    "timesteps": 123726960,
    "learntime": 0.1789423010777682,
    "sampletime": 18.45886773383245,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 344,
    "reward_mean": -8.947728179006866,
    "reward_max": 1.7303835227272861,
    "reward_min": -15.606676136363644,
    "reward_std": 3.4418000008153675,
    "timesteps": 124087680,
    "learntime": 0.18591361888684332,
    "sampletime": 18.53781292703934,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 345,
    "reward_mean": -11.489179188121447,
    "reward_max": -2.618963068181848,
    "reward_min": -19.28971590909094,
    "reward_std": 3.6645725418709025,
    "timesteps": 124448400,
    "learntime": 0.20651042414829135,
    "sampletime": 18.61982109490782,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 346,
    "reward_mean": -14.97459380178742,
    "reward_max": -9.13768465909088,
    "reward_min": -24.4519744318183,
    "reward_std": 3.3975870590306143,
    "timesteps": 124809120,
    "learntime": 0.21019178605638444,
    "sampletime": 18.535988199990243,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 347,
    "reward_mean": -12.093669969963301,
    "reward_max": -5.693210227272697,
    "reward_min": -19.269161931818232,
    "reward_std": 3.0935774100526965,
    "timesteps": 125169840,
    "learntime": 0.19443055195733905,
    "sampletime": 18.43744378001429,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 348,
    "reward_mean": -8.583091393673055,
    "reward_max": 0.8072395833333554,
    "reward_min": -16.565468750000054,
    "reward_std": 3.5510941864918077,
    "timesteps": 125530560,
    "learntime": 0.19876459101215005,
    "sampletime": 19.203197959810495,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 349,
    "reward_mean": -12.005619469844932,
    "reward_max": -7.242301136363605,
    "reward_min": -17.943338068181838,
    "reward_std": 2.6205843379287574,
    "timesteps": 125891280,
    "learntime": 0.1984021111857146,
    "sampletime": 18.69680630089715,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 350,
    "reward_mean": -10.630190836588538,
    "reward_max": -3.6016015624999973,
    "reward_min": -17.653977272727293,
    "reward_std": 3.593656227827562,
    "timesteps": 126252000,
    "learntime": 0.18348863907158375,
    "sampletime": 18.45103474589996,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 351,
    "reward_mean": -11.219879224372637,
    "reward_max": -4.114453124999989,
    "reward_min": -22.32142045454556,
    "reward_std": 3.182232387231155,
    "timesteps": 126612720,
    "learntime": 0.1967815039679408,
    "sampletime": 18.887958789942786,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 352,
    "reward_mean": -12.410402906013267,
    "reward_max": -3.6379403409091045,
    "reward_min": -18.30163352272732,
    "reward_std": 3.02921157774413,
    "timesteps": 126973440,
    "learntime": 0.19227038696408272,
    "sampletime": 18.540966467000544,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 353,
    "reward_mean": -11.655519150242672,
    "reward_max": -3.090170454545459,
    "reward_min": -18.74193181818185,
    "reward_std": 3.411711868266912,
    "timesteps": 127334160,
    "learntime": 0.18702428019605577,
    "sampletime": 18.69559304206632,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 354,
    "reward_mean": -12.923048817027706,
    "reward_max": -4.791458333333292,
    "reward_min": -21.99592329545464,
    "reward_std": 3.0843169419417293,
    "timesteps": 127694880,
    "learntime": 0.19636822305619717,
    "sampletime": 18.489767910912633,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 355,
    "reward_mean": -11.68395626183713,
    "reward_max": -2.9040234374999803,
    "reward_min": -21.09680397727277,
    "reward_std": 3.311722929365699,
    "timesteps": 128055600,
    "learntime": 0.19769854098558426,
    "sampletime": 18.70693069882691,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 356,
    "reward_mean": -10.103420021750708,
    "reward_max": -1.6502864583333114,
    "reward_min": -17.2394460227273,
    "reward_std": 3.03614847108597,
    "timesteps": 128416320,
    "learntime": 0.1946822099853307,
    "sampletime": 18.69250521203503,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 357,
    "reward_mean": -10.892582878343996,
    "reward_max": -4.094630681818192,
    "reward_min": -17.68946614583338,
    "reward_std": 3.104409324468461,
    "timesteps": 128777040,
    "learntime": 0.1969516018871218,
    "sampletime": 18.499243263853714,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 358,
    "reward_mean": -8.519268521395583,
    "reward_max": -3.8410677083333,
    "reward_min": -16.35002604166669,
    "reward_std": 2.905192405621165,
    "timesteps": 129137760,
    "learntime": 0.19374185800552368,
    "sampletime": 18.76523051294498,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 359,
    "reward_mean": -5.992786791252362,
    "reward_max": 2.4658806818181467,
    "reward_min": -13.229557291666657,
    "reward_std": 3.4244009236282986,
    "timesteps": 129498480,
    "learntime": 0.19499613484367728,
    "sampletime": 18.577188682043925,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 360,
    "reward_mean": -5.991292299212834,
    "reward_max": 3.4279971590909324,
    "reward_min": -13.892784090909087,
    "reward_std": 3.296461792309997,
    "timesteps": 129859200,
    "learntime": 0.2000009708572179,
    "sampletime": 18.41725899395533,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 361,
    "reward_mean": -10.886663818359386,
    "reward_max": -1.439232954545445,
    "reward_min": -18.754453125000072,
    "reward_std": 3.5894325574865866,
    "timesteps": 130219920,
    "learntime": 0.20025854790583253,
    "sampletime": 18.54567902116105,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 362,
    "reward_mean": -9.533953635475864,
    "reward_max": -2.2851302083333818,
    "reward_min": -15.972135416666688,
    "reward_std": 3.141608369617509,
    "timesteps": 130580640,
    "learntime": 0.18223629496060312,
    "sampletime": 18.48729246109724,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 363,
    "reward_mean": -9.923123631332857,
    "reward_max": 1.7322869318181737,
    "reward_min": -18.194517045454585,
    "reward_std": 4.079347581221891,
    "timesteps": 130941360,
    "learntime": 0.1961567981634289,
    "sampletime": 18.589612738927826,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 364,
    "reward_mean": -8.50391669995857,
    "reward_max": 1.6939322916666455,
    "reward_min": -18.475781250000036,
    "reward_std": 4.0030541411592875,
    "timesteps": 131302080,
    "learntime": 0.19271672097966075,
    "sampletime": 18.618590531870723,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 365,
    "reward_mean": -10.583668453332166,
    "reward_max": -0.917684659090881,
    "reward_min": -18.085937500000075,
    "reward_std": 3.9929976444245314,
    "timesteps": 131662800,
    "learntime": 0.1788016720674932,
    "sampletime": 18.6584255839698,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 366,
    "reward_mean": -11.698248420484134,
    "reward_max": -6.508210227272707,
    "reward_min": -18.98897135416671,
    "reward_std": 2.845653528716064,
    "timesteps": 132023520,
    "learntime": 0.18608339107595384,
    "sampletime": 18.59908679081127,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 367,
    "reward_mean": -12.455608705462845,
    "reward_max": -4.56404829545452,
    "reward_min": -25.557954545454674,
    "reward_std": 3.6054733018563923,
    "timesteps": 132384240,
    "learntime": 0.18986899894662201,
    "sampletime": 18.490697502857074,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 368,
    "reward_mean": -7.526338778409072,
    "reward_max": -1.2954557291666464,
    "reward_min": -14.710653409090874,
    "reward_std": 2.847545013964968,
    "timesteps": 132744960,
    "learntime": 0.1872062711045146,
    "sampletime": 18.620154635980725,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 369,
    "reward_mean": -7.317845421993363,
    "reward_max": 0.29353693181823065,
    "reward_min": -15.061946022727312,
    "reward_std": 3.272744488350707,
    "timesteps": 133105680,
    "learntime": 0.19875078392215073,
    "sampletime": 18.725361034972593,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 370,
    "reward_mean": -6.683445564038816,
    "reward_max": 1.7819460227272428,
    "reward_min": -18.163423295454596,
    "reward_std": 3.6399246072431413,
    "timesteps": 133466400,
    "learntime": 0.2068278081715107,
    "sampletime": 18.627718139905483,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 371,
    "reward_mean": -11.954407071200276,
    "reward_max": -3.0605965909091073,
    "reward_min": -17.801178977272745,
    "reward_std": 2.892427896349339,
    "timesteps": 133827120,
    "learntime": 0.1961008608341217,
    "sampletime": 18.667696385877207,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 372,
    "reward_mean": -13.049161210493612,
    "reward_max": -5.004417613636321,
    "reward_min": -20.100667613636393,
    "reward_std": 2.7438409392240555,
    "timesteps": 134187840,
    "learntime": 0.1939256521873176,
    "sampletime": 18.477223325055093,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 373,
    "reward_mean": -13.583587757457396,
    "reward_max": -5.224772727272713,
    "reward_min": -20.175426136363637,
    "reward_std": 3.634772531978481,
    "timesteps": 134548560,
    "learntime": 0.19712346885353327,
    "sampletime": 18.760902510024607,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 374,
    "reward_mean": -11.352362911339963,
    "reward_max": -3.974361979166646,
    "reward_min": -19.480994318181864,
    "reward_std": 2.876527701981894,
    "timesteps": 134909280,
    "learntime": 0.18731118994764984,
    "sampletime": 18.599273156141862,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 375,
    "reward_mean": -11.172621811375478,
    "reward_max": -2.4563210227272756,
    "reward_min": -19.728423295454597,
    "reward_std": 3.8218296287006828,
    "timesteps": 135270000,
    "learntime": 0.18878729501739144,
    "sampletime": 18.566318508936092,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 376,
    "reward_mean": -7.6913342840021315,
    "reward_max": 0.4285227272727383,
    "reward_min": -15.17238636363637,
    "reward_std": 3.593800064176842,
    "timesteps": 135630720,
    "learntime": 0.18334341887384653,
    "sampletime": 18.53157647512853,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 377,
    "reward_mean": -9.58461017030658,
    "reward_max": -3.25042613636362,
    "reward_min": -18.95498697916669,
    "reward_std": 2.903842503505534,
    "timesteps": 135991440,
    "learntime": 0.18780662794597447,
    "sampletime": 18.66355464118533,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 378,
    "reward_mean": -9.555211181640615,
    "reward_max": -3.139957386363598,
    "reward_min": -17.772713068181897,
    "reward_std": 3.0656507781948,
    "timesteps": 136352160,
    "learntime": 0.20519467000849545,
    "sampletime": 18.63616282516159,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 379,
    "reward_mean": -8.561364468661221,
    "reward_max": -0.8048579545454607,
    "reward_min": -15.582315340909133,
    "reward_std": 3.221445604273212,
    "timesteps": 136712880,
    "learntime": 0.1906981528736651,
    "sampletime": 18.47118495986797,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 380,
    "reward_mean": -8.159890562115276,
    "reward_max": 2.3415767045454743,
    "reward_min": -14.464218750000027,
    "reward_std": 3.255126764260731,
    "timesteps": 137073600,
    "learntime": 0.19515990698710084,
    "sampletime": 18.37596239312552,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 381,
    "reward_mean": -3.6975511585582206,
    "reward_max": 5.9347443181817985,
    "reward_min": -10.435156249999995,
    "reward_std": 3.146543153265643,
    "timesteps": 137434320,
    "learntime": 0.20238972804509103,
    "sampletime": 18.35135909006931,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 382,
    "reward_mean": -6.802013623786689,
    "reward_max": 0.33231770833333557,
    "reward_min": -13.987357954545455,
    "reward_std": 3.5817404344425596,
    "timesteps": 137795040,
    "learntime": 0.197205234086141,
    "sampletime": 18.608072424074635,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 383,
    "reward_mean": -12.204179262103475,
    "reward_max": -4.808815104166659,
    "reward_min": -17.268011363636386,
    "reward_std": 2.710194751856198,
    "timesteps": 138155760,
    "learntime": 0.18931441684253514,
    "sampletime": 18.749626340111718,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 384,
    "reward_mean": -13.96541847922587,
    "reward_max": -6.428835227272751,
    "reward_min": -22.63387784090914,
    "reward_std": 3.580817496562936,
    "timesteps": 138516480,
    "learntime": 0.19678376894444227,
    "sampletime": 18.703780276933685,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 385,
    "reward_mean": -12.901374844637793,
    "reward_max": -3.4657386363636182,
    "reward_min": -21.205807291666705,
    "reward_std": 3.3270911391081768,
    "timesteps": 138877200,
    "learntime": 0.18307495093904436,
    "sampletime": 18.624112914083526,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 386,
    "reward_mean": -11.78996694853813,
    "reward_max": -2.1224005681818365,
    "reward_min": -18.567386363636388,
    "reward_std": 3.1254998761685537,
    "timesteps": 139237920,
    "learntime": 0.18573967786505818,
    "sampletime": 18.878093891078606,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 387,
    "reward_mean": -12.696705451734154,
    "reward_max": -5.2810227272727355,
    "reward_min": -20.470156250000073,
    "reward_std": 3.5038789362433578,
    "timesteps": 139598640,
    "learntime": 0.1906396730337292,
    "sampletime": 18.78417293005623,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 388,
    "reward_mean": -10.599501842152,
    "reward_max": -2.39609375000003,
    "reward_min": -19.16500000000005,
    "reward_std": 3.8692805239771872,
    "timesteps": 139959360,
    "learntime": 0.19782165391370654,
    "sampletime": 18.667418045923114,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 389,
    "reward_mean": -9.538321033824573,
    "reward_max": -1.1771732954545473,
    "reward_min": -19.466519886363667,
    "reward_std": 3.693727064705538,
    "timesteps": 140320080,
    "learntime": 0.1966181460302323,
    "sampletime": 18.588111608987674,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 390,
    "reward_mean": -9.290723599520595,
    "reward_max": -2.404119318181806,
    "reward_min": -16.215497159090965,
    "reward_std": 2.8857384517629403,
    "timesteps": 140680800,
    "learntime": 0.1909637360367924,
    "sampletime": 18.67400189116597,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 391,
    "reward_mean": -10.47277843128552,
    "reward_max": -2.980156250000025,
    "reward_min": -16.359518229166707,
    "reward_std": 3.1774318125034675,
    "timesteps": 141041520,
    "learntime": 0.19910348812118173,
    "sampletime": 18.62221248401329,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 392,
    "reward_mean": -13.975349065607253,
    "reward_max": -6.325198863636351,
    "reward_min": -20.778863636363656,
    "reward_std": 3.1131293353441096,
    "timesteps": 141402240,
    "learntime": 0.1980863658245653,
    "sampletime": 18.696939383866265,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 393,
    "reward_mean": -14.144999963009008,
    "reward_max": -6.787201704545432,
    "reward_min": -20.197741477272814,
    "reward_std": 2.950943691107441,
    "timesteps": 141762960,
    "learntime": 0.21136049088090658,
    "sampletime": 18.68661760003306,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 394,
    "reward_mean": -13.653464410955275,
    "reward_max": -8.267997159090923,
    "reward_min": -19.979034090909153,
    "reward_std": 2.774084364552809,
    "timesteps": 142123680,
    "learntime": 0.19100890215486288,
    "sampletime": 18.688192851142958,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 395,
    "reward_mean": -13.03441173206676,
    "reward_max": 0.7888210227272946,
    "reward_min": -20.761562500000025,
    "reward_std": 3.567678662570805,
    "timesteps": 142484400,
    "learntime": 0.18684209906496108,
    "sampletime": 18.58293240889907,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 396,
    "reward_mean": -11.736504313151052,
    "reward_max": -0.1508380681817893,
    "reward_min": -19.765703125000083,
    "reward_std": 3.5146459697790324,
    "timesteps": 142845120,
    "learntime": 0.19412392587400973,
    "sampletime": 18.953940260922536,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 397,
    "reward_mean": -14.742058438387817,
    "reward_max": -1.8245880681819038,
    "reward_min": -22.741860795454677,
    "reward_std": 4.166998634018413,
    "timesteps": 143205840,
    "learntime": 0.2080590408295393,
    "sampletime": 18.925768346060067,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 398,
    "reward_mean": -12.728994103634022,
    "reward_max": -4.8320880681818315,
    "reward_min": -19.2223153409091,
    "reward_std": 3.3315060523216307,
    "timesteps": 143566560,
    "learntime": 0.19056805316358805,
    "sampletime": 18.830156906042248,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 399,
    "reward_mean": -9.658049112955748,
    "reward_max": -1.5706249999999984,
    "reward_min": -19.17642045454558,
    "reward_std": 3.7706590051247235,
    "timesteps": 143927280,
    "learntime": 0.20265591307543218,
    "sampletime": 18.598714185878634,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 400,
    "reward_mean": -11.286907089695811,
    "reward_max": -5.399417613636357,
    "reward_min": -22.49072443181829,
    "reward_std": 3.8620598937733415,
    "timesteps": 144288000,
    "learntime": 0.20227520703338087,
    "sampletime": 18.622792065842077,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 401,
    "reward_mean": -13.905912882486998,
    "reward_max": -6.072698863636341,
    "reward_min": -18.991497395833377,
    "reward_std": 2.9928118816328846,
    "timesteps": 144648720,
    "learntime": 0.16412384388968349,
    "sampletime": 18.625780911184847,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 402,
    "reward_mean": -14.225316421046415,
    "reward_max": -5.452812499999965,
    "reward_min": -20.642713068181898,
    "reward_std": 3.4310102880935536,
    "timesteps": 145009440,
    "learntime": 0.1950045581907034,
    "sampletime": 18.91271320404485,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 403,
    "reward_mean": -13.441113799124075,
    "reward_max": -3.3981107954545227,
    "reward_min": -19.894375000000075,
    "reward_std": 3.5904804656536635,
    "timesteps": 145370160,
    "learntime": 0.2014208270702511,
    "sampletime": 18.775563227944076,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 404,
    "reward_mean": -11.383919363310856,
    "reward_max": -5.229752604166668,
    "reward_min": -19.85507102272734,
    "reward_std": 3.1761512927913222,
    "timesteps": 145730880,
    "learntime": 0.19078904413618147,
    "sampletime": 18.730455345008522,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 405,
    "reward_mean": -8.679988310842795,
    "reward_max": -0.701718749999986,
    "reward_min": -15.811988636363639,
    "reward_std": 3.5170316065630622,
    "timesteps": 146091600,
    "learntime": 0.3073460180312395,
    "sampletime": 18.85157427098602,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 406,
    "reward_mean": -9.431444628166437,
    "reward_max": -0.42171875000000014,
    "reward_min": -18.32622159090911,
    "reward_std": 3.478526987821418,
    "timesteps": 146452320,
    "learntime": 0.18932652799412608,
    "sampletime": 18.446560957003385,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 407,
    "reward_mean": -9.891454097863395,
    "reward_max": -2.636676136363626,
    "reward_min": -15.220611979166689,
    "reward_std": 3.058407570526966,
    "timesteps": 146813040,
    "learntime": 0.18141741794534028,
    "sampletime": 18.514691313030198,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 408,
    "reward_mean": -14.589841345584759,
    "reward_max": -8.051676136363588,
    "reward_min": -22.055924479166706,
    "reward_std": 3.1563459046984437,
    "timesteps": 147173760,
    "learntime": 0.2004874579142779,
    "sampletime": 18.753026416059583,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 409,
    "reward_mean": -11.262753739790485,
    "reward_max": -4.570312499999987,
    "reward_min": -19.47370738636367,
    "reward_std": 3.3219769943817403,
    "timesteps": 147534480,
    "learntime": 0.2050280519761145,
    "sampletime": 18.72468726313673,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 410,
    "reward_mean": -9.11834411621093,
    "reward_max": -1.5694176136364282,
    "reward_min": -16.326796875000056,
    "reward_std": 3.562903444277844,
    "timesteps": 147895200,
    "learntime": 0.1927550700493157,
    "sampletime": 18.5991159719415,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 411,
    "reward_mean": -10.106024003462348,
    "reward_max": -3.2406818181818164,
    "reward_min": -19.802713068181838,
    "reward_std": 3.5051154840087544,
    "timesteps": 148255920,
    "learntime": 0.19495303183794022,
    "sampletime": 18.43670642701909,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 412,
    "reward_mean": -11.767275520093515,
    "reward_max": -4.112315340909067,
    "reward_min": -19.944908854166716,
    "reward_std": 3.0908753058982175,
    "timesteps": 148616640,
    "learntime": 0.2009636079892516,
    "sampletime": 18.60949062020518,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 413,
    "reward_mean": -15.410164369525372,
    "reward_max": -8.215582386363618,
    "reward_min": -24.572578125000067,
    "reward_std": 3.5082731970315115,
    "timesteps": 148977360,
    "learntime": 0.19864208297803998,
    "sampletime": 18.62995138997212,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 414,
    "reward_mean": -12.877147512724928,
    "reward_max": -5.529869791666701,
    "reward_min": -20.024674479166745,
    "reward_std": 3.1681143507064324,
    "timesteps": 149338080,
    "learntime": 0.2099162780214101,
    "sampletime": 18.641547315986827,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 415,
    "reward_mean": -7.7025791422526,
    "reward_max": 4.657670454545407,
    "reward_min": -16.601505681818235,
    "reward_std": 3.6361180291150488,
    "timesteps": 149698800,
    "learntime": 0.19325149501673877,
    "sampletime": 18.36364943603985,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 416,
    "reward_mean": -7.84305913751777,
    "reward_max": -2.0345703124999996,
    "reward_min": -16.46791193181819,
    "reward_std": 3.5307395951944573,
    "timesteps": 150059520,
    "learntime": 0.3007045239210129,
    "sampletime": 18.720125938998535,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 417,
    "reward_mean": -7.479256536310356,
    "reward_max": -2.3401278409090853,
    "reward_min": -17.547317708333356,
    "reward_std": 2.842436414423296,
    "timesteps": 150420240,
    "learntime": 0.17997979489155114,
    "sampletime": 18.608105619903654,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 418,
    "reward_mean": -10.332086533055152,
    "reward_max": -2.6642613636363635,
    "reward_min": -17.174375000000005,
    "reward_std": 2.8238831385784096,
    "timesteps": 150780960,
    "learntime": 0.32103070989251137,
    "sampletime": 18.434511156985536,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 419,
    "reward_mean": -10.201535977450273,
    "reward_max": -3.558167613636314,
    "reward_min": -15.410809659090893,
    "reward_std": 2.5012171115568482,
    "timesteps": 151141680,
    "learntime": 0.3252323940396309,
    "sampletime": 18.50028262892738,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 420,
    "reward_mean": -11.209139644738405,
    "reward_max": -0.294588068181829,
    "reward_min": -17.660710227272777,
    "reward_std": 3.5701346150330484,
    "timesteps": 151502400,
    "learntime": 0.20493969204835594,
    "sampletime": 18.68317295704037,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 421,
    "reward_mean": -13.662769830877146,
    "reward_max": -2.9721164772727375,
    "reward_min": -21.413082386363687,
    "reward_std": 3.8027140658552,
    "timesteps": 151863120,
    "learntime": 0.3206433567684144,
    "sampletime": 18.652588078053668,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 422,
    "reward_mean": -12.838999448834056,
    "reward_max": -4.677372159090897,
    "reward_min": -21.092059659090975,
    "reward_std": 3.145599985701231,
    "timesteps": 152223840,
    "learntime": 0.2063072680030018,
    "sampletime": 19.003566480008885,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 423,
    "reward_mean": -14.063223950935148,
    "reward_max": -6.15759943181817,
    "reward_min": -24.49738636363644,
    "reward_std": 3.565256394385493,
    "timesteps": 152584560,
    "learntime": 0.2829475549515337,
    "sampletime": 18.609230472007766,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 424,
    "reward_mean": -13.997202185428508,
    "reward_max": -5.481107954545422,
    "reward_min": -23.50383522727278,
    "reward_std": 2.9699823482480103,
    "timesteps": 152945280,
    "learntime": 0.20105205685831606,
    "sampletime": 18.855416839011014,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 425,
    "reward_mean": -13.013758729876901,
    "reward_max": 0.4539914772727343,
    "reward_min": -21.533963068181855,
    "reward_std": 4.099081662166073,
    "timesteps": 153306000,
    "learntime": 0.2984799640253186,
    "sampletime": 18.68302552518435,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 426,
    "reward_mean": -12.739332349372647,
    "reward_max": -6.173579545454558,
    "reward_min": -20.44228693181825,
    "reward_std": 2.8934541734725965,
    "timesteps": 153666720,
    "learntime": 0.21225604810751975,
    "sampletime": 18.687464002054185,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 427,
    "reward_mean": -14.467033284505225,
    "reward_max": -8.267698863636294,
    "reward_min": -23.28875000000005,
    "reward_std": 3.1004877096978047,
    "timesteps": 154027440,
    "learntime": 0.3097984360065311,
    "sampletime": 18.72696591494605,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 428,
    "reward_mean": -11.565425673976097,
    "reward_max": -1.7878124999999623,
    "reward_min": -20.597585227272816,
    "reward_std": 3.3608739180628864,
    "timesteps": 154388160,
    "learntime": 0.1839357998687774,
    "sampletime": 18.618060083827004,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 429,
    "reward_mean": -14.561386774236517,
    "reward_max": -5.516747159090913,
    "reward_min": -25.170894886363723,
    "reward_std": 3.8600757716165357,
    "timesteps": 154748880,
    "learntime": 0.28404992492869496,
    "sampletime": 18.61895136605017,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 430,
    "reward_mean": -16.961021099668574,
    "reward_max": -9.326647727272695,
    "reward_min": -24.74366477272736,
    "reward_std": 3.2226546301543375,
    "timesteps": 155109600,
    "learntime": 0.19796748599037528,
    "sampletime": 18.77167090610601,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 431,
    "reward_mean": -10.369591471354148,
    "reward_max": -1.3088920454545496,
    "reward_min": -15.886335227272722,
    "reward_std": 3.158204935936755,
    "timesteps": 155470320,
    "learntime": 0.31050394708290696,
    "sampletime": 18.53385361796245,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 432,
    "reward_mean": -11.683105598218514,
    "reward_max": -3.921484374999983,
    "reward_min": -18.530980113636414,
    "reward_std": 3.3374344311105286,
    "timesteps": 155831040,
    "learntime": 0.19546479498967528,
    "sampletime": 18.639399570878595,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 433,
    "reward_mean": -12.804635749585712,
    "reward_max": -6.753281250000014,
    "reward_min": -21.952471590909173,
    "reward_std": 2.93050864668827,
    "timesteps": 156191760,
    "learntime": 0.28462713095359504,
    "sampletime": 18.647555934032425,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 434,
    "reward_mean": -11.70671462550309,
    "reward_max": -2.4126704545454563,
    "reward_min": -20.27981534090913,
    "reward_std": 4.095956784464234,
    "timesteps": 156552480,
    "learntime": 0.19336641114205122,
    "sampletime": 18.69035877007991,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 435,
    "reward_mean": -13.164545731977995,
    "reward_max": -2.981960227272736,
    "reward_min": -22.812542613636452,
    "reward_std": 4.278938369672455,
    "timesteps": 156913200,
    "learntime": 0.2930583590641618,
    "sampletime": 18.812457664171234,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 436,
    "reward_mean": -13.059282189571503,
    "reward_max": -3.192727272727261,
    "reward_min": -27.510710227272785,
    "reward_std": 4.790169651866089,
    "timesteps": 157273920,
    "learntime": 0.19676417810842395,
    "sampletime": 18.684010786004364,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 437,
    "reward_mean": -14.899078054717107,
    "reward_max": -6.429389204545427,
    "reward_min": -26.163096590909163,
    "reward_std": 4.257957695874019,
    "timesteps": 157634640,
    "learntime": 0.3007572328206152,
    "sampletime": 18.788575349841267,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 438,
    "reward_mean": -13.691976669773911,
    "reward_max": -7.703451704545481,
    "reward_min": -24.807741477272785,
    "reward_std": 3.3401974153728977,
    "timesteps": 157995360,
    "learntime": 0.20236420189030468,
    "sampletime": 18.669797253096476,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 439,
    "reward_mean": -11.169024843158148,
    "reward_max": -4.035142045454497,
    "reward_min": -22.047215909090934,
    "reward_std": 3.73296979760796,
    "timesteps": 158356080,
    "learntime": 0.32392285484820604,
    "sampletime": 18.735474560875446,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 440,
    "reward_mean": -11.121978944720652,
    "reward_max": -0.7495596590908827,
    "reward_min": -21.46990056818188,
    "reward_std": 3.812960833300446,
    "timesteps": 158716800,
    "learntime": 0.1911979541182518,
    "sampletime": 18.521095572039485,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 441,
    "reward_mean": -14.660890613902717,
    "reward_max": -5.952457386363583,
    "reward_min": -23.351605113636456,
    "reward_std": 3.5726084837465435,
    "timesteps": 159077520,
    "learntime": 0.2905088060069829,
    "sampletime": 18.902447445783764,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 442,
    "reward_mean": -15.36887604684541,
    "reward_max": -6.456164772727228,
    "reward_min": -25.152940340909154,
    "reward_std": 3.872619836602886,
    "timesteps": 159438240,
    "learntime": 0.1885752200614661,
    "sampletime": 18.571073467144743,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 443,
    "reward_mean": -12.37183320016571,
    "reward_max": -5.545351562499968,
    "reward_min": -25.722698863636435,
    "reward_std": 3.266683986434239,
    "timesteps": 159798960,
    "learntime": 0.30220765504054725,
    "sampletime": 18.662970780860633,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 444,
    "reward_mean": -13.247435395211902,
    "reward_max": -4.881718750000036,
    "reward_min": -21.872073863636427,
    "reward_std": 3.946285560708227,
    "timesteps": 160159680,
    "learntime": 0.19120331201702356,
    "sampletime": 18.626851505134255,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 445,
    "reward_mean": -13.820497492009945,
    "reward_max": -4.736789772727247,
    "reward_min": -21.997954545454586,
    "reward_std": 3.6272457833939984,
    "timesteps": 160520400,
    "learntime": 0.2964891130104661,
    "sampletime": 18.922495257109404,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 446,
    "reward_mean": -14.79432038278292,
    "reward_max": -3.345028409090857,
    "reward_min": -28.115582386363748,
    "reward_std": 4.623114179518967,
    "timesteps": 160881120,
    "learntime": 0.1971297999843955,
    "sampletime": 18.689249254064634,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 447,
    "reward_mean": -12.41052800958807,
    "reward_max": -3.9619744318181485,
    "reward_min": -19.224900568181837,
    "reward_std": 2.895341308583872,
    "timesteps": 161241840,
    "learntime": 0.31431890884414315,
    "sampletime": 18.525654811179265,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 448,
    "reward_mean": -13.569152591589734,
    "reward_max": -5.699275568181817,
    "reward_min": -20.390553977272788,
    "reward_std": 2.977717435223734,
    "timesteps": 161602560,
    "learntime": 0.20842883316799998,
    "sampletime": 18.79490234516561,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 449,
    "reward_mean": -12.105516875295926,
    "reward_max": -2.2965056818181213,
    "reward_min": -20.574583333333393,
    "reward_std": 3.487069196080025,
    "timesteps": 161963280,
    "learntime": 0.29612899804487824,
    "sampletime": 18.730834249872714,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 450,
    "reward_mean": -12.948417117956922,
    "reward_max": -4.637997159090931,
    "reward_min": -22.753707386363722,
    "reward_std": 3.032324439518206,
    "timesteps": 162324000,
    "learntime": 0.19901054189540446,
    "sampletime": 18.665303837973624,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 451,
    "reward_mean": -10.266779711174246,
    "reward_max": -3.6178124999999457,
    "reward_min": -17.275681818181845,
    "reward_std": 3.2777836503447295,
    "timesteps": 162684720,
    "learntime": 0.29788667312823236,
    "sampletime": 18.995278146816418,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 452,
    "reward_mean": -13.257929206616975,
    "reward_max": -4.407571022727345,
    "reward_min": -20.4367755681819,
    "reward_std": 3.346051197671407,
    "timesteps": 163045440,
    "learntime": 0.19204495195299387,
    "sampletime": 18.960376046132296,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 453,
    "reward_mean": -12.033993030894885,
    "reward_max": -5.776789772727245,
    "reward_min": -21.350852272727323,
    "reward_std": 3.331840422496052,
    "timesteps": 163406160,
    "learntime": 0.2811818749178201,
    "sampletime": 18.701541383052245,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 454,
    "reward_mean": -14.432958337032451,
    "reward_max": -5.181321022727254,
    "reward_min": -23.09519886363645,
    "reward_std": 3.9844921721756394,
    "timesteps": 163766880,
    "learntime": 0.18587631010450423,
    "sampletime": 19.022226332919672,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 455,
    "reward_mean": -16.06272592255565,
    "reward_max": -6.433124999999964,
    "reward_min": -22.766321022727315,
    "reward_std": 3.343325232206174,
    "timesteps": 164127600,
    "learntime": 0.2801884619984776,
    "sampletime": 18.72628258704208,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 456,
    "reward_mean": -12.142622255267543,
    "reward_max": -1.295455729166677,
    "reward_min": -19.655497159090917,
    "reward_std": 4.161946518945035,
    "timesteps": 164488320,
    "learntime": 0.20463955402374268,
    "sampletime": 19.088258802890778,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 457,
    "reward_mean": -12.492247721354174,
    "reward_max": -2.917400568181799,
    "reward_min": -23.938880208333373,
    "reward_std": 4.446574191038671,
    "timesteps": 164849040,
    "learntime": 0.3019982180558145,
    "sampletime": 18.78654058696702,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 458,
    "reward_mean": -9.201107011274845,
    "reward_max": -0.5769140624999806,
    "reward_min": -18.946931818181863,
    "reward_std": 3.093972325533545,
    "timesteps": 165209760,
    "learntime": 0.19528670003637671,
    "sampletime": 18.51656852522865,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 459,
    "reward_mean": -10.081394708806812,
    "reward_max": -4.551264204545423,
    "reward_min": -18.11563802083337,
    "reward_std": 2.9102143265504776,
    "timesteps": 165570480,
    "learntime": 0.30827477388083935,
    "sampletime": 18.61053816904314,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 460,
    "reward_mean": -11.123049223928746,
    "reward_max": -2.2217613636364195,
    "reward_min": -17.676349431818196,
    "reward_std": 3.680485051629124,
    "timesteps": 165931200,
    "learntime": 0.19202971807681024,
    "sampletime": 18.717587357852608,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 461,
    "reward_mean": -11.468743249141813,
    "reward_max": -4.2887926136363195,
    "reward_min": -19.818153409090954,
    "reward_std": 3.8500398166762175,
    "timesteps": 166291920,
    "learntime": 0.31506905099377036,
    "sampletime": 18.751213821116835,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 462,
    "reward_mean": -15.486794932972344,
    "reward_max": -4.882825520833324,
    "reward_min": -26.055056818181924,
    "reward_std": 3.9780073929855715,
    "timesteps": 166652640,
    "learntime": 0.19661886617541313,
    "sampletime": 19.050578789087012,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 463,
    "reward_mean": -11.440387406782673,
    "reward_max": -5.534857954545445,
    "reward_min": -17.382102272727312,
    "reward_std": 2.693579691605423,
    "timesteps": 167013360,
    "learntime": 0.3011066869366914,
    "sampletime": 18.76260973396711,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 464,
    "reward_mean": -11.283522449840207,
    "reward_max": -4.607159090909101,
    "reward_min": -20.066718750000067,
    "reward_std": 3.5189398126241307,
    "timesteps": 167374080,
    "learntime": 0.20696313492953777,
    "sampletime": 18.593775116838515,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 465,
    "reward_mean": -11.141944802024156,
    "reward_max": -2.0286067708333193,
    "reward_min": -19.402585227272763,
    "reward_std": 3.8981025718398143,
    "timesteps": 167734800,
    "learntime": 0.31037450302392244,
    "sampletime": 18.5587213661056,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 466,
    "reward_mean": -8.248437222567468,
    "reward_max": -0.6385511363636357,
    "reward_min": -17.3549857954546,
    "reward_std": 3.295747751476029,
    "timesteps": 168095520,
    "learntime": 0.18876520707271993,
    "sampletime": 18.636518883984536,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 467,
    "reward_mean": -9.265532725941048,
    "reward_max": 2.4034517045454336,
    "reward_min": -18.458735795454558,
    "reward_std": 4.413814482795896,
    "timesteps": 168456240,
    "learntime": 0.3005653719883412,
    "sampletime": 18.601094376994297,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 468,
    "reward_mean": -8.777639511570788,
    "reward_max": -1.2730208333333248,
    "reward_min": -16.093309659090973,
    "reward_std": 3.6820597724294983,
    "timesteps": 168816960,
    "learntime": 0.1958767520263791,
    "sampletime": 18.624082583002746,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 469,
    "reward_mean": -11.546293260978938,
    "reward_max": 2.6676704545454832,
    "reward_min": -22.30014204545461,
    "reward_std": 4.0718340818445755,
    "timesteps": 169177680,
    "learntime": 0.3043371639214456,
    "sampletime": 18.824673474067822,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 470,
    "reward_mean": -10.924133300781255,
    "reward_max": 0.11098011363639415,
    "reward_min": -21.06807291666675,
    "reward_std": 3.86196087285891,
    "timesteps": 169538400,
    "learntime": 0.19036589888855815,
    "sampletime": 18.622257028939202,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 471,
    "reward_mean": -7.998391520182288,
    "reward_max": 0.137741477272771,
    "reward_min": -15.963963068181869,
    "reward_std": 4.042127950985666,
    "timesteps": 169899120,
    "learntime": 0.2854533880017698,
    "sampletime": 18.43093451904133,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 472,
    "reward_mean": -12.164086895567022,
    "reward_max": -2.4820028409090655,
    "reward_min": -19.398181818181882,
    "reward_std": 3.556613217119489,
    "timesteps": 170259840,
    "learntime": 0.2016216809861362,
    "sampletime": 19.03830233006738,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 473,
    "reward_mean": -9.360191188003077,
    "reward_max": -2.1559375000000203,
    "reward_min": -15.126406250000024,
    "reward_std": 2.9854293877252784,
    "timesteps": 170620560,
    "learntime": 0.2833452250342816,
    "sampletime": 18.572316077072173,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 474,
    "reward_mean": -9.081116573449336,
    "reward_max": -0.8120028409090924,
    "reward_min": -16.441448863636356,
    "reward_std": 3.2983886931066837,
    "timesteps": 170981280,
    "learntime": 0.20234036212787032,
    "sampletime": 18.48596445005387,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 475,
    "reward_mean": -12.216619114731316,
    "reward_max": -7.391633522727307,
    "reward_min": -22.345553977272804,
    "reward_std": 3.057895182061766,
    "timesteps": 171342000,
    "learntime": 0.3151832411531359,
    "sampletime": 18.537340672919527,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 476,
    "reward_mean": -15.499458414713564,
    "reward_max": -4.525184659090875,
    "reward_min": -21.44049479166675,
    "reward_std": 3.8157580598621963,
    "timesteps": 171702720,
    "learntime": 0.19251049193553627,
    "sampletime": 18.951411911984906,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 477,
    "reward_mean": -8.984066199100361,
    "reward_max": -0.6128124999999561,
    "reward_min": -17.430340909090916,
    "reward_std": 3.4412917358040165,
    "timesteps": 172063440,
    "learntime": 0.28965373197570443,
    "sampletime": 18.564326116116717,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 478,
    "reward_mean": -6.260559211499761,
    "reward_max": 2.210325520833343,
    "reward_min": -15.100937500000002,
    "reward_std": 3.8355188982741097,
    "timesteps": 172424160,
    "learntime": 0.21168506587855518,
    "sampletime": 18.292975982883945,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 479,
    "reward_mean": -7.692668900923294,
    "reward_max": 2.9103409090909422,
    "reward_min": -15.731988636363662,
    "reward_std": 3.99351827303184,
    "timesteps": 172784880,
    "learntime": 0.2748747579753399,
    "sampletime": 18.958042015088722,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 480,
    "reward_mean": -11.90074544270835,
    "reward_max": -4.317434895833329,
    "reward_min": -18.542698863636396,
    "reward_std": 3.186883727398963,
    "timesteps": 173145600,
    "learntime": 0.19745497801341116,
    "sampletime": 18.732251523062587,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 481,
    "reward_mean": -10.123687244762088,
    "reward_max": -1.105980113636382,
    "reward_min": -16.85536931818186,
    "reward_std": 3.2691895120940013,
    "timesteps": 173506320,
    "learntime": 0.30931253801099956,
    "sampletime": 18.67383817816153,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 482,
    "reward_mean": -8.503900090997863,
    "reward_max": -0.5242187499999887,
    "reward_min": -17.708309659090954,
    "reward_std": 3.199677547816077,
    "timesteps": 173867040,
    "learntime": 0.20679371105507016,
    "sampletime": 18.590008048107848,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 483,
    "reward_mean": -8.094235506924697,
    "reward_max": -1.1787357954545075,
    "reward_min": -13.189322916666653,
    "reward_std": 2.3342991231228756,
    "timesteps": 174227760,
    "learntime": 0.2902840038295835,
    "sampletime": 18.398229802958667,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 484,
    "reward_mean": -7.845316550514902,
    "reward_max": -0.16958806818179425,
    "reward_min": -16.1103551136364,
    "reward_std": 3.752047463381723,
    "timesteps": 174588480,
    "learntime": 0.20653313305228949,
    "sampletime": 18.56676066783257,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 485,
    "reward_mean": -11.334570904356077,
    "reward_max": -0.7659517045454695,
    "reward_min": -19.751505681818312,
    "reward_std": 3.9875077108237282,
    "timesteps": 174949200,
    "learntime": 0.301230848999694,
    "sampletime": 18.848497906001285,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 486,
    "reward_mean": -11.59228534120503,
    "reward_max": -5.637926136363618,
    "reward_min": -21.52193181818188,
    "reward_std": 3.321971405962166,
    "timesteps": 175309920,
    "learntime": 0.1968863841611892,
    "sampletime": 18.588197072967887,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 487,
    "reward_mean": -10.889187381628789,
    "reward_max": -6.092727272727251,
    "reward_min": -19.15080965909091,
    "reward_std": 2.9823467528592658,
    "timesteps": 175670640,
    "learntime": 0.31305737397633493,
    "sampletime": 18.627399178920314,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 488,
    "reward_mean": -9.386179698597289,
    "reward_max": 1.0759517045454543,
    "reward_min": -19.27213068181822,
    "reward_std": 3.712431718994148,
    "timesteps": 176031360,
    "learntime": 0.20849150395952165,
    "sampletime": 18.697760197799653,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 489,
    "reward_mean": -9.276834050958817,
    "reward_max": 3.2765624999999443,
    "reward_min": -22.42511363636372,
    "reward_std": 4.359906109270107,
    "timesteps": 176392080,
    "learntime": 0.3024718319065869,
    "sampletime": 18.72929343697615,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 490,
    "reward_mean": -15.388169296727064,
    "reward_max": -5.164531249999974,
    "reward_min": -25.206860795454602,
    "reward_std": 3.877952211005849,
    "timesteps": 176752800,
    "learntime": 0.20301561593078077,
    "sampletime": 18.83896326320246,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 491,
    "reward_mean": -13.148001246596845,
    "reward_max": -3.8281534090908793,
    "reward_min": -21.33709635416672,
    "reward_std": 3.877922136798344,
    "timesteps": 177113520,
    "learntime": 0.3092625788412988,
    "sampletime": 18.76058574905619,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 492,
    "reward_mean": -8.68093289462003,
    "reward_max": 1.308451704545413,
    "reward_min": -16.558877840909147,
    "reward_std": 3.820753729099097,
    "timesteps": 177474240,
    "learntime": 0.20013994397595525,
    "sampletime": 18.6429887060076,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 493,
    "reward_mean": -5.675454342004016,
    "reward_max": 2.7649005681817957,
    "reward_min": -16.76610795454545,
    "reward_std": 3.5124998088104014,
    "timesteps": 177834960,
    "learntime": 0.302228928077966,
    "sampletime": 18.431526153115556,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 494,
    "reward_mean": -5.053803230054434,
    "reward_max": 6.495284090909103,
    "reward_min": -12.205156249999987,
    "reward_std": 3.644887956754053,
    "timesteps": 178195680,
    "learntime": 0.1834167179185897,
    "sampletime": 18.65929400618188,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 495,
    "reward_mean": -8.156298532196967,
    "reward_max": -0.5669602272727274,
    "reward_min": -16.70742897727275,
    "reward_std": 3.6447463614890845,
    "timesteps": 178556400,
    "learntime": 0.3127984299790114,
    "sampletime": 18.591383968945593,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 496,
    "reward_mean": -11.131707356770832,
    "reward_max": -0.6290340909090464,
    "reward_min": -20.691519886363743,
    "reward_std": 3.5392046779571436,
    "timesteps": 178917120,
    "learntime": 0.19457096001133323,
    "sampletime": 18.81920207408257,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 497,
    "reward_mean": -10.225381007339,
    "reward_max": -4.219401041666617,
    "reward_min": -18.30205965909095,
    "reward_std": 3.4008947242513985,
    "timesteps": 179277840,
    "learntime": 0.19333964120596647,
    "sampletime": 18.707775355083868,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 498,
    "reward_mean": -12.924852535363392,
    "reward_max": -7.400481770833307,
    "reward_min": -20.791576704545466,
    "reward_std": 3.1574497954686693,
    "timesteps": 179638560,
    "learntime": 0.28554380196146667,
    "sampletime": 18.724275588057935,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 499,
    "reward_mean": -12.046333303740543,
    "reward_max": -1.571653645833342,
    "reward_min": -22.64210937500005,
    "reward_std": 4.255179803952152,
    "timesteps": 179999280,
    "learntime": 0.20088887913152575,
    "sampletime": 18.466501360060647,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  },
  {
    "gen": 500,
    "reward_mean": -9.706420657995972,
    "reward_max": 0.927670454545488,
    "reward_min": -18.848565340909133,
    "reward_std": 4.056155167704478,
    "timesteps": 180360000,
    "learntime": 0.30475172493606806,
    "sampletime": 18.41926133004017,
    "best_max_mean": -2.326923791133998,
    "best_max": 8.34898437499997
  }
]